Spaces:

fffiloni
/

Image-to-Fragrance

Running on Zero

App Files Files Community

fffiloni committed on Jun 28

Commit

9065d18

verified ·

1 Parent(s): 866755a

Handle the case where the LLM does not provide a note description

Browse files

Files changed (1) hide show

app.py +32 -8

app.py CHANGED Viewed

@@ -66,27 +66,51 @@ Here is the scene description to analyze:
     return cleaned_text
 def parse_perfume_description(text: str) -> dict:
-    # Extract main fields
     perfume_name = re.search(r'Perfume Name:\s*(.+)', text).group(1).strip()
-    tagline = re.search(r'Tagline:\s*"(.*?)"', text, re.DOTALL).group(1).strip()
-    poetic_desc = re.search(r'Poetic Olfactory Description:\s*"(.*?)"', text, re.DOTALL).group(1).strip()
-    general_atmosphere = re.search(r'General Atmosphere:\s*(.+)', text, re.DOTALL).group(1).strip()
-    # More flexible notes extractor
     def extract_notes(section_name):
         pattern = rf'{section_name}:\s*\n((?:\*.*(?:\n|$))+)'
         match = re.search(pattern, text, re.MULTILINE)
         if not match:
             return []
         notes_text = match.group(1)
-        notes = re.findall(r'\*\s*(.*?):\s*(.*)', notes_text)
-        return [{'note': note.strip(), 'description': desc.strip()} for note, desc in notes]
     top_notes = extract_notes('Top Notes')
     heart_notes = extract_notes('Heart Notes')
     base_notes = extract_notes('Base Notes')
-    # Build final JSON structure
     result = {
         'Perfume Name': perfume_name,
         'Tagline': tagline,

     return cleaned_text
 def parse_perfume_description(text: str) -> dict:
+    # Perfume Name
     perfume_name = re.search(r'Perfume Name:\s*(.+)', text).group(1).strip()
+    # Tagline (still expects quotes)
+    tagline = re.search(r'Tagline:\s*"(.*?)"', text, re.DOTALL)
+    tagline = tagline.group(1).strip() if tagline else ""
+    # Poetic Olfactory Description: allow quoted or plain
+    poetic_desc_match = re.search(
+        r'Poetic Olfactory Description:\s*"(.*?)"', text, re.DOTALL)
+    if poetic_desc_match:
+        poetic_desc = poetic_desc_match.group(1).strip()
+    else:
+        # fallback: get everything until next section
+        poetic_desc_match = re.search(
+            r'Poetic Olfactory Description:\s*(.*?)\s*Olfactory Pyramid:', text, re.DOTALL)
+        poetic_desc = poetic_desc_match.group(1).strip() if poetic_desc_match else ""
+    # General Atmosphere: same idea
+    general_atmosphere_match = re.search(
+        r'General Atmosphere:\s*(.+)', text, re.DOTALL)
+    general_atmosphere = general_atmosphere_match.group(1).strip() if general_atmosphere_match else ""
+    # Flexible note extractor for bullet points
     def extract_notes(section_name):
         pattern = rf'{section_name}:\s*\n((?:\*.*(?:\n|$))+)'
         match = re.search(pattern, text, re.MULTILINE)
         if not match:
             return []
         notes_text = match.group(1)
+        notes = []
+        for line in notes_text.strip().splitlines():
+            bullet = line.strip().lstrip('*').strip()
+            # If it has ":", split note & description
+            if ':' in bullet:
+                note, desc = bullet.split(':', 1)
+                notes.append({'note': note.strip(), 'description': desc.strip()})
+            else:
+                notes.append({'note': bullet, 'description': ''})
+        return notes
     top_notes = extract_notes('Top Notes')
     heart_notes = extract_notes('Heart Notes')
     base_notes = extract_notes('Base Notes')
     result = {
         'Perfume Name': perfume_name,
         'Tagline': tagline,