vif: Allow computing VIF only for variables in the formula
This commit is contained in:
parent
461e00df78
commit
bb534cb285
@ -28,8 +28,16 @@ import itertools
|
|||||||
|
|
||||||
from .utils import Estimate, check_nan, fmt_p_html, fmt_p_text
|
from .utils import Estimate, check_nan, fmt_p_html, fmt_p_text
|
||||||
|
|
||||||
def vif(df, nan_policy='warn'):
|
def vif(df, formula=None, nan_policy='warn'):
|
||||||
"""Calculate the variance inflation factor for each variable in df"""
|
"""
|
||||||
|
Calculate the variance inflation factor for each variable in df
|
||||||
|
|
||||||
|
formula: If specified, calculate the VIF only for the variables in the formula
|
||||||
|
"""
|
||||||
|
|
||||||
|
if formula:
|
||||||
|
# Only consider columns in the formula
|
||||||
|
df = df[cols_for_formula(formula)]
|
||||||
|
|
||||||
# Check for/clean NaNs
|
# Check for/clean NaNs
|
||||||
df = check_nan(df, nan_policy)
|
df = check_nan(df, nan_policy)
|
||||||
|
Loading…
Reference in New Issue
Block a user