Key driver analysis to yield clues into **potential** causal relationships in your data by determining variables with high predictive power, high correlation with outcome, etc.
import pandas as pd
df = pd.read_csv('sample_data/houses.csv')
from causalnlp.key_driver_analysis import KeyDriverAnalysis
kda = KeyDriverAnalysis(df, outcome_col='SalePrice', ignore_cols=['Id', 'YearSold'])
df_results = kda.correlations()
df_results.head()
assert df_results.iloc[[0]].index.values[0] == 'OverallQual'
df_results = kda.importances()
df_results.head()
import pandas as pd
df = pd.read_csv('sample_data/adult-census.csv')
kda = KeyDriverAnalysis(df, outcome_col='class', ignore_cols=['fnlwgt'])
df_results = kda.importances(use_shap=True, plot=True)
df_results.head()