Skip to content

Commit db57984

Browse files
committed
Add OCR regex to detect Nutri-Score v2 via the "Nouveau calcul" ("new calculation") text
1 parent: 1e5761f · commit: db57984

2 files changed

Lines changed: 26 additions & 0 deletions

File tree

robotoff/prediction/ocr/label.py

Lines changed: 11 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -95,6 +95,17 @@ def process_es_bio_label_code(match) -> str:
9595
"en:nutriscore": [
9696
OCRRegex(re.compile(r"NUTRI-SCORE"), field=OCRField.full_text),
9797
],
98+
"en:nutriscore-v2": [
99+
OCRRegex(
100+
re.compile(
101+
r"nouveau calcul|new calculation|neue berechnung|nuevo c[áa]lculo|"
102+
r"nuovo calcolo|nieuwe berekening|novo c[áa]lculo|ny beregning|"
103+
r"uusi laskenta|novi izra[čc]un|ново изчисление",
104+
re.I,
105+
),
106+
field=OCRField.full_text_contiguous,
107+
),
108+
],
98109
"en:eu-non-eu-agriculture": [
99110
OCRRegex(
100111
re.compile(

tests/unit/prediction/ocr/test_label.py

Lines changed: 15 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -32,6 +32,21 @@ def test_es_ocr_regex(input_str: str, is_match: bool, output: str | None):
3232
("homologation LA 42/05", ["fr:label-rouge"]),
3333
("Homologation n°LA19/05", ["fr:label-rouge"]),
3434
("Homologation n°LA 02/91", ["fr:label-rouge"]),
35+
("Nouveau calcul", ["en:nutriscore-v2"]),
36+
("NOUVEAU CALCUL", ["en:nutriscore-v2"]),
37+
("nouveau calcul", ["en:nutriscore-v2"]),
38+
("New calculation", ["en:nutriscore-v2"]),
39+
("Neue Berechnung", ["en:nutriscore-v2"]),
40+
("Nuevo cálculo", ["en:nutriscore-v2"]),
41+
("Nuevo calculo", ["en:nutriscore-v2"]),
42+
("Nuovo calcolo", ["en:nutriscore-v2"]),
43+
("Nieuwe berekening", ["en:nutriscore-v2"]),
44+
("Novo cálculo", ["en:nutriscore-v2"]),
45+
("Ny beregning", ["en:nutriscore-v2"]),
46+
("Uusi laskenta", ["en:nutriscore-v2"]),
47+
("Novi izračun", ["en:nutriscore-v2"]),
48+
("Ново изчисление", ["en:nutriscore-v2"]),
49+
("NUTRI-SCORE Nouveau calcul", ["en:nutriscore", "en:nutriscore-v2"]),
3550
],
3651
)
3752
def test_find_labels(text: str, value_tags: list[str]):

0 commit comments

Comments
 (0)