refactor: clean up imports and improve gender normalization method

This commit is contained in:
2025-09-20 22:55:24 +02:00
parent 0816207a2c
commit dd2a9f2711
5 changed files with 226 additions and 82 deletions
+1 -1
View File
@@ -9,7 +9,7 @@ import pandas as pd
from pydantic import BaseModel
from core.config.pipeline_config import PipelineConfig
-from core.utils.data_loader import OPTIMIZED_DTYPES, DataLoader
+from core.utils.data_loader import DataLoader
from processing.batch.batch_config import BatchConfig
+2 -1
View File
@@ -150,7 +150,8 @@ class FeatureExtractionStep(PipelineStep):
except Exception as e:
logging.warning(f"NER tagging failed for row {idx}: {e}")
-def _normalize_gender(self, series: pd.Series) -> pd.Series:
+@classmethod
+def _normalize_gender(cls, series: pd.Series) -> pd.Series:
gender_mapping = {
"m": "m",
"male": "m",