fix(ml): parse datetime column and fix TA-Lib pattern names

- Add parse_dates parameter when loading enriched CSV
- Strip timezone from annotation timestamps to match data
- Fix pattern names: CDLTHREEWHITESOLDIERS -> CDL3WHITESOLDIERS
- Fix pattern names: CDLTHREEBLACKCROWS -> CDL3BLACKCROWS
2026-02-15 21:13:20 +01:00 · 2026-02-15 21:13:20 +01:00 · ceb4103ec4
commit ceb4103ec4
parent 2b86524436
10 changed files with 5 additions and 5 deletions
--- a/services/ml/app/__pycache__/annotation_ingestion.cpython-313.pyc
+++ b/services/ml/app/__pycache__/annotation_ingestion.cpython-313.pyc
--- a/services/ml/app/__pycache__/db.cpython-313.pyc
+++ b/services/ml/app/__pycache__/db.cpython-313.pyc
--- a/services/ml/app/annotation_ingestion.py
+++ b/services/ml/app/annotation_ingestion.py
@@ -188,8 +188,8 @@ class AnnotationIngestion:
        for ann in annotations:
            label = ann['label']
-            start_time = pd.Timestamp(ann['start_time'])
+            start_time = pd.Timestamp(ann['start_time']).tz_localize(None)
-            end_time = pd.Timestamp(ann['end_time'])
+            end_time = pd.Timestamp(ann['end_time']).tz_localize(None)
            # Find candles in span
            span_mask = (df['time'] >= start_time) & (df['time'] <= end_time)
@@ -504,7 +504,7 @@ def run_annotation_ingestion(
    logger.info("Running annotation ingestion stage")
    # Load enriched data
-    enriched_df = pd.read_csv(enriched_path)
+    enriched_df = pd.read_csv(enriched_path, parse_dates=['time'])
    logger.info(f"Loaded enriched data: {enriched_df.shape}")
    # Process annotations
--- a/services/ml/config/pipeline.yaml
+++ b/services/ml/config/pipeline.yaml
@@ -86,8 +86,8 @@ stages:
        - "CDLHARAMI"
        - "CDLPIERCING"
        - "CDLDARKCLOUDCOVER"
-        - "CDLTHREEWHITESOLDIERS"
+        - "CDL3WHITESOLDIERS"
-        - "CDLTHREEBLACKCROWS"
+        - "CDL3BLACKCROWS"
    # Label merge strategy: "human_priority", "programmatic_priority", "both"
    merge_strategy: "human_priority"
--- a/services/ml/training/__pycache__/__init__.cpython-313.pyc
+++ b/services/ml/training/__pycache__/__init__.cpython-313.pyc
--- a/services/ml/training/__pycache__/evaluation.cpython-313.pyc
+++ b/services/ml/training/__pycache__/evaluation.cpython-313.pyc
--- a/services/ml/training/__pycache__/train.cpython-313.pyc
+++ b/services/ml/training/__pycache__/train.cpython-313.pyc
--- a/services/ml/training/models/__pycache__/__init__.cpython-313.pyc
+++ b/services/ml/training/models/__pycache__/__init__.cpython-313.pyc
--- a/services/ml/training/models/__pycache__/random_forest.cpython-313.pyc
+++ b/services/ml/training/models/__pycache__/random_forest.cpython-313.pyc
--- a/services/ml/training/models/__pycache__/xgboost_model.cpython-313.pyc
+++ b/services/ml/training/models/__pycache__/xgboost_model.cpython-313.pyc