Fix a bug in the result storage of the factor CoSTEER

microsoft · WinstonLiyt · Nov 25, 2024 · Nov 25, 2024 · Nov 25, 2024 · Nov 25, 2024
commit de4d413feff26011a3c4c6e15d65bb96b05e94f1
diff --git a/rdagent/components/coder/factor_coder/factor.py b/rdagent/components/coder/factor_coder/factor.py
@@ -147,7 +147,10 @@ def execute(self, data_type: str = "Debug") -> Tuple[str, pd.DataFrame]:
                 execution_code_path = code_path
             elif self.target_task.version == 2:
                 execution_code_path = self.workspace_path / f"{uuid.uuid4()}.py"
-                execution_code_path.write_text((Path(__file__).parent / "factor_execution_template.txt").read_text())
+                if KAGGLE_IMPLEMENT_SETTING.template_path == "rdagent/scenarios/kaggle/tpl_ex":
+                    execution_code_path.write_text((Path(__file__).parent / "factor_execution_template_v2.txt").read_text())
+                else:
+                    execution_code_path.write_text((Path(__file__).parent / "factor_execution_template_v1.txt").read_text())
 
             try:
                 subprocess.check_output(

diff --git a/rdagent/components/coder/factor_coder/factor_execution_template.txt b/rdagent/components/coder/factor_coder/factor_execution_template_v1.txt
diff --git a/rdagent/components/coder/factor_coder/factor_execution_template_v2.txt b/rdagent/components/coder/factor_coder/factor_execution_template_v2.txt
@@ -0,0 +1,16 @@
+import os
+import h5py
+import numpy as np  # NOTE(review): not referenced anywhere in this template
+import pandas as pd
+from feat01 import feat_eng  # presumably the generated feature code placed next to this script; verify against caller
+# Load the pickled inputs; only X.pkl is checked for existence, y.pkl is then read unconditionally.
+if os.path.exists("X.pkl"):
+    X = pd.read_pickle("X.pkl")
+    y = pd.read_pickle("y.pkl")
+else:
+    raise FileNotFoundError("No valid data found.")
+# feat_eng returns three values; only the first (X) is used below, y and p are not read again.
+X, y, p = feat_eng(X, y)
+# Store X as the 'default' dataset of result.h5; mode 'w' creates the file, replacing any existing one.
+with h5py.File('result.h5', 'w') as hf:
+    hf.create_dataset('default', data=X)