Spaces:

fffiloni
/

Image-to-Fragrance

Running on Zero

fffiloni committed on Jun 28

Commit

866755a

verified ·

1 Parent(s): 061f3b8

regex grab properly indented notes

Files changed (1) hide show

app.py CHANGED Viewed

@@ -72,13 +72,13 @@ def parse_perfume_description(text: str) -> dict:
     poetic_desc = re.search(r'Poetic Olfactory Description:\s*"(.*?)"', text, re.DOTALL).group(1).strip()
     general_atmosphere = re.search(r'General Atmosphere:\s*(.+)', text, re.DOTALL).group(1).strip()
-    # Helper for pyramid sections
     def extract_notes(section_name):
-        pattern = rf'{section_name}:\s*((?:\*\s.*\n?)+)'
-        match = re.search(pattern, text)
         if not match:
             return []
-        notes_text = match.group(1).strip()
         notes = re.findall(r'\*\s*(.*?):\s*(.*)', notes_text)
         return [{'note': note.strip(), 'description': desc.strip()} for note, desc in notes]

     poetic_desc = re.search(r'Poetic Olfactory Description:\s*"(.*?)"', text, re.DOTALL).group(1).strip()
     general_atmosphere = re.search(r'General Atmosphere:\s*(.+)', text, re.DOTALL).group(1).strip()
+    # More flexible notes extractor
     def extract_notes(section_name):
+        pattern = rf'{section_name}:\s*\n((?:\*.*(?:\n|$))+)'
+        match = re.search(pattern, text, re.MULTILINE)
         if not match:
             return []
+        notes_text = match.group(1)
         notes = re.findall(r'\*\s*(.*?):\s*(.*)', notes_text)
         return [{'note': note.strip(), 'description': desc.strip()} for note, desc in notes]