Spaces:

fffiloni
/

Image-to-Fragrance

Running on Zero

App Files Files Community

fffiloni committed on Jun 28

Commit

bb4631d

verified ·

1 Parent(s): 3d97999

try to handle all notes cases

Browse files

Files changed (1) hide show

app.py +41 -28

app.py CHANGED Viewed

@@ -78,6 +78,46 @@ Here is the scene description to analyze:
     cleaned_text = re.sub(pattern, '', output_text, flags=re.DOTALL)
     return cleaned_text
 def parse_perfume_description(text: str) -> dict:
     # Perfume Name
     perfume_name = re.search(r'Perfume Name:\s*(.+)', text).group(1).strip()
@@ -113,34 +153,7 @@ def parse_perfume_description(text: str) -> dict:
         image_desc = image_desc_match.group(1).strip() if image_desc_match else ""
     # 🗂️ Smart bullet extractor
-    def extract_notes(text, section_name):
-        # Try block of bullets
-        pattern_block = rf'{section_name}:\s*\n((?:\*.*(?:\n|$))+)'
-        match_block = re.search(pattern_block, text, re.MULTILINE)
-        if match_block:
-            notes_text = match_block.group(1)
-            notes = []
-            for line in notes_text.strip().splitlines():
-                bullet = line.strip().lstrip('*').strip()
-                if ':' in bullet:
-                    note, desc = bullet.split(':', 1)
-                    notes.append({'note': note.strip(), 'description': desc.strip()})
-                else:
-                    notes.append({'note': bullet, 'description': ''})
-            return notes
-        # Try inline bullet style: * Section: item1, item2, item3
-        pattern_inline = rf'\* {section_name}:\s*(.+)'
-        match_inline = re.search(pattern_inline, text)
-        if match_inline:
-            notes_raw = match_inline.group(1).strip()
-            notes = []
-            for item in notes_raw.split(','):
-                notes.append({'note': item.strip(), 'description': ''})
-            return notes
-        return []
     top_notes = extract_notes(text, 'Top Notes')
     heart_notes = extract_notes(text, 'Heart Notes')
     base_notes = extract_notes(text, 'Base Notes')

     cleaned_text = re.sub(pattern, '', output_text, flags=re.DOTALL)
     return cleaned_text
+def _split_note_list(raw):
+    """Turn a comma-separated string into note dicts, skipping blank items."""
+    return [
+        {'note': item.strip(), 'description': ''}
+        for item in raw.split(',')
+        if item.strip()
+    ]
+
+
+def extract_notes(text, section_name):
+    """Extract the notes listed under ``section_name`` from ``text``.
+
+    Three layouts are tried, in this order:
+
+    1. A header line followed by a block of ``*`` bullets, where each bullet
+       is either ``note`` or ``note: description``.
+    2. An inline bullet: ``* Section: item1, item2, item3``.
+    3. A plain line without a bullet: ``Section: item1, item2, item3``.
+
+    Args:
+        text: The full perfume description to search.
+        section_name: Literal section header, e.g. ``'Top Notes'``.
+
+    Returns:
+        A list of ``{'note': str, 'description': str}`` dicts; an empty list
+        when no layout matches. Blank bullets and blank comma-separated
+        items are skipped.
+    """
+    # The header is literal text, so escape it before building the patterns.
+    header = re.escape(section_name)
+
+    # 1. Try block of bullets
+    match_block = re.search(
+        rf'{header}:\s*\n((?:\*.*(?:\n|$))+)', text, re.MULTILINE
+    )
+    if match_block:
+        notes = []
+        for line in match_block.group(1).strip().splitlines():
+            bullet = line.strip().lstrip('*').strip()
+            if not bullet:
+                # A bare "*" carries no note.
+                continue
+            note, sep, desc = bullet.partition(':')
+            if sep:
+                notes.append({'note': note.strip(), 'description': desc.strip()})
+            else:
+                notes.append({'note': bullet, 'description': ''})
+        return notes
+
+    # 2. Inline bullet style, then 3. plain line style (no bullet).
+    single_line_patterns = (
+        (rf'\* {header}:\s*(.+)', 0),
+        (rf'^{header}:\s*(.+)$', re.MULTILINE),
+    )
+    for pattern, flags in single_line_patterns:
+        match = re.search(pattern, text, flags)
+        if match:
+            return _split_note_list(match.group(1))
+
+    return []
 def parse_perfume_description(text: str) -> dict:
     # Perfume Name
     perfume_name = re.search(r'Perfume Name:\s*(.+)', text).group(1).strip()
         image_desc = image_desc_match.group(1).strip() if image_desc_match else ""
     # 🗂️ Smart bullet extractor
     top_notes = extract_notes(text, 'Top Notes')
     heart_notes = extract_notes(text, 'Heart Notes')
     base_notes = extract_notes(text, 'Base Notes')