chagu13
/

is_click_predictor

KaiquanMah committed on Feb 15, 2025

Commit

f5755a2

verified ·

1 Parent(s): b0bc543

Yair - Fixed CatBoost. Works with cat_features

Files changed (1) hide show

model_predictor.py CHANGED Viewed

@@ -1,9 +1,24 @@
 import numpy as np
 import pandas as pd
 def predict(models, X_test):
     """ Make predictions using trained models """
-    test_predictions = {name: np.array(model.predict(X_test)).squeeze() for name, model in models.items()}
     test_predictions_df = pd.DataFrame(test_predictions)
@@ -15,3 +30,4 @@ def predict(models, X_test):
     test_predictions_df["is_click_predicted"] = test_predictions_df.max(axis=1)
     return test_predictions_df

 import numpy as np
 import pandas as pd
+from catboost import Pool
+from data_loader import CATEGORICAL_COLUMNS, IDS_COLUMNS, TARGET_COLUMN, FEATURE_COLUMNS, AGGREGATED_COLUMNS, TEMPORAL_COLUMNS
 def predict(models, X_test):
     """ Make predictions using trained models """
+    # Ensure categorical features are properly handled
+    cat_features =  CATEGORICAL_COLUMNS
+    test_predictions = {}
+    #
+    # test_predictions = {name: np.array(model.predict(X_test)).squeeze() for name, model in models.items()}
+    for name, model in models.items():
+        if "CatBoost" in name:  # Handle CatBoost models
+            pool = Pool(data=X_test, cat_features=cat_features)
+            test_predictions[name] = model.predict(pool)
+        else:  # Other models
+            # reordering columns to match the order of columns in the model
+            new_X_test = X_test[IDS_COLUMNS + FEATURE_COLUMNS + AGGREGATED_COLUMNS + TEMPORAL_COLUMNS]
+            test_predictions[name] = np.array(model.predict(new_X_test)).squeeze()
     test_predictions_df = pd.DataFrame(test_predictions)
     test_predictions_df["is_click_predicted"] = test_predictions_df.max(axis=1)
     return test_predictions_df