Spaces:

asdfaman
/

sadhya

Running

Added Llama-3.2-3B-Instruct; requirements.txt needs to be updated

by RatanPrakash - opened Nov 23, 2024

←

Files changed (1) hide show

app.py CHANGED Viewed

@@ -11,6 +11,22 @@ import dateparser
 import os
 import matplotlib.pyplot as plt
 # Function to get Instagram post details
 import instaloader
 def get_instagram_post_details(post_url):
@@ -344,6 +360,16 @@ elif app_mode == "Task 1":
                 st.write(f"Extracting details from {uploaded_image.name}...")
                 result = ocr.ocr(img_array, cls=True)
                 # Process the OCR result to extract product name and properties
                 product_name, product_details = extract_product_info(result)

 import os
 import matplotlib.pyplot as plt
+# LLM integration: a Llama-3.2-3B-Instruct text-generation pipeline used to turn raw OCR text into product details.
+import torch
+from transformers import pipeline
+model_id = "meta-llama/Llama-3.2-3B-Instruct"  # model identifier handed to pipeline() below
+pipe = pipeline(  # created at module level; NOTE(review): if this script re-runs per interaction (st.* calls suggest Streamlit), the model is reloaded each time - consider caching; confirm
+    "text-generation",
+    model=model_id,
+    torch_dtype=torch.bfloat16,  # request bfloat16 weights
+    device_map="auto",  # leave device placement to the library
+)
+messages = [  # system prompt that opens the conversation sent to `pipe`
+    {"role": "system", "content": """Your task is to get the product details out of the text given. The text given will be raw text from OCR of social media images of products,
+                                     and the goal is to get product details and description so that it can be used for amazon product listing. """},
+]
 # Function to get Instagram post details
 import instaloader
 def get_instagram_post_details(post_url):
                 st.write(f"Extracting details from {uploaded_image.name}...")
                 result = ocr.ocr(img_array, cls=True)
+                messages.append({"role": "user", "content": result})
+                outputs = pipe(
+                    messages,
+                    max_new_tokens=256,
+                )
+                productContent = outputs[0]["generated_text"][-1]
+                st.markdown(productContent)
                 # Process the OCR result to extract product name and properties
                 product_name, product_details = extract_product_info(result)