From 4dde7bd8b5c7cc1197e8cc2e46dc6e6f48f9c4fa Mon Sep 17 00:00:00 2001 From: kisfenyo Date: Tue, 24 Feb 2026 16:10:42 +0100 Subject: [PATCH] Extract parenthesised notes from food name to extra field MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit E.g. "fehérborecet (ízlés szerint)" → food="fehérborecet", extra="ízlés szerint" Co-Authored-By: Claude Opus 4.6 --- app/scraper.py | 8 ++++++++ 1 file changed, 8 insertions(+) diff --git a/app/scraper.py b/app/scraper.py index 68f6f0e..5189acd 100644 --- a/app/scraper.py +++ b/app/scraper.py @@ -221,6 +221,14 @@ def _parse_streetkitchen(soup: BeautifulSoup, url: str) -> dict: # Split "200g" → qty="200", unit="g" qty, unit = _split_qty_unit(qty_raw) + # Extract parenthesised note from inside food name + # e.g. "fehérborecet (ízlés szerint)" → food="fehérborecet", extra="ízlés szerint" + if not extra: + m = re.match(r"^(.+?)\s*\(([^)]+)\)\s*$", food) + if m: + food = m.group(1).strip() + extra = m.group(2).strip() + ingredients.append({ "quantity": qty, "unit": unit,