fix: escape csv field to avoid error on empty fields

This commit is contained in:
2025-08-17 13:39:19 +02:00
parent ed60f9deff
commit 3122c92f5e
4 changed files with 15 additions and 9 deletions
+2 -4
View File
@@ -8,6 +8,7 @@ from typing import Dict, Any, List, Tuple
import spacy
from spacy.training import Example
from spacy.util import minibatch
from tqdm import tqdm
from core.config.pipeline_config import PipelineConfig
@@ -198,13 +199,10 @@ class NameModel:
# Create training examples
examples = []
for text, annotations in data:
for text, annotations in tqdm(data, description="Create training examples"):
doc = self.nlp.make_doc(text)
example = Example.from_dict(doc, annotations)
examples.append(example)
logging.info(
f"Training example: {text[:30]} with entities {annotations.get('entities', [])}"
)
# Train in batches
batches = minibatch(examples, size=batch_size)