Spaces:

ibombonato
/

nat-ad

Running

App Files Files Community

ibombonato committed 18 days ago

Commit

94a7d52

verified ·

1 Parent(s): 3cdec01

Add Mercado Livre support (#4)

Browse files

- Add Mercado Livre support (472175aa7e87eff9693e48929495ceaa655412d3)

Files changed (19) hide show

.clinerules +91 -0
.gitattributes +3 -0
GEMINI.md +91 -0
README.md +13 -2
app.py +76 -133
assets/Montserrat-Bold.ttf +3 -0
assets/Montserrat-Regular.ttf +3 -0
assets/template_natura_empty.jpg +3 -0
generate_image_tool.py +101 -0
image_generator_tool.py +78 -0
main.py +66 -0
merchs/merch.py +73 -0
pyproject.toml +13 -0
scrape.py +46 -0
stealth_scrape_tool.py +10 -2
test_tool.py +13 -0
tests/test_utils_url_tool.py +38 -0
utils_tools.py +119 -0
uv.lock +46 -0

.clinerules ADDED Viewed

	@@ -0,0 +1,91 @@

+# Copilot Instructions for the Project
+## Ignore files and folders
+- You should ignore the files and folders below:
+  - .venv/
+  - .vscode/
+  - __pycache__/
+  - build/
+  - chroma.db/
+  - vibe_dspy.egg-info/
+- Ignore files that are mentioned inside .gitignore
+## Environment and Secrets
+- All credentials and config are loaded from `.env` using `python-dotenv`.
+- For DB access, use `DB_USER`, `DB_PASS_ENCODED`, `DB_HOST`, `DB_PORT`, `DB_DATABASE`.
+- For LLMs, use `AZURE_OPENAI_API_KEY`, `AZURE_OPENAI_ENDPOINT`, `AZURE_OPENAI_DEPLOYMENT_NAME`.
+## Conventions and Workflows
+- Always use environment variables for secrets and config.
+- Always use `uv run` to run code and code tools.
+- Always use `pytest` for unit tests and run them with `uv run pytest`.
+- Always use `uv` and `uv add` to manage dependencies.
+## References
+- See `README.md` for high-level goals and links.
+## Security and Environment File Handling
+- **Never read, modify, index, or delete any `.env` files.**
+- Do not access, print, or manipulate environment variable files (e.g., `.env`) in any way.
+- All environment configuration is managed outside of AI agent operations for security and compliance.
+## Commit Message Guidelines (Conventional Commits)
+All commit messages should adhere to the [Conventional Commits specification](https://www.conventionalcommits.org/en/v1.0.0/). This provides a standardized format for commit messages, making it easier to understand the purpose of a commit and to automate changelog generation.
+The basic structure of a commit message is:
+```
+<type>[optional scope]: <description>
+[optional body]
+[optional footer(s)]
+```
+### Type
+The `type` is a mandatory prefix that indicates the kind of change introduced by the commit. Common types include:
+*   `feat`: A new feature
+*   `fix`: A bug fix
+*   `docs`: Documentation only changes
+*   `style`: Changes that do not affect the meaning of the code (white-space, formatting, missing semicolons, etc.)
+*   `refactor`: A code change that neither fixes a bug nor adds a feature
+*   `perf`: A code change that improves performance
+*   `test`: Adding missing tests or correcting existing tests
+*   `build`: Changes that affect the build system or external dependencies (example scopes: npm, gulp, broccoli, make)
+*   `ci`: Changes to our CI configuration files and scripts (example scopes: Travis, Circle, BrowserStack, SauceLabs)
+*   `chore`: Other changes that don't modify src or test files
+*   `revert`: Reverts a previous commit
+### Scope (Optional)
+The `scope` provides additional contextual information about the change. It is enclosed in parentheses after the `type`. For example, `feat(parser): add ability to parse arrays`.
+### Description
+The `description` is a concise, imperative, present-tense summary of the change. It should not be capitalized and should not end with a period.
+### Body (Optional)
+The `body` provides a longer, more detailed explanation of the commit's changes. It should be separated from the description by a blank line.
+### Footer(s) (Optional)
+The `footer` can contain information about breaking changes, references to issues, or other metadata. Breaking changes should start with `BREAKING CHANGE:` followed by a description.
+### Examples
+*   `feat: add new user authentication module`
+*   `fix(auth): correct password validation bug`
+*   `docs: update README with installation instructions`
+*   `refactor(api): simplify error handling logic`
+*   `refactor(core)!: remove old API endpoint`
+    `BREAKING CHANGE: The /api/v1/old-endpoint has been removed. Use /api/v1/new-endpoint instead.`

.gitattributes CHANGED Viewed

@@ -33,3 +33,6 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+assets/Montserrat-Bold.ttf filter=lfs diff=lfs merge=lfs -text
+assets/Montserrat-Regular.ttf filter=lfs diff=lfs merge=lfs -text
+assets/template_natura_empty.jpg filter=lfs diff=lfs merge=lfs -text

GEMINI.md ADDED Viewed

	@@ -0,0 +1,91 @@

+# Copilot Instructions for the Project
+## Ignore files and folders
+- You should ignore the files and folders below:
+  - .venv/
+  - .vscode/
+  - __pycache__/
+  - build/
+  - chroma.db/
+  - vibe_dspy.egg-info/
+- Ignore files that are mentioned inside .gitignore
+## Environment and Secrets
+- All credentials and config are loaded from `.env` using `python-dotenv`.
+- For DB access, use `DB_USER`, `DB_PASS_ENCODED`, `DB_HOST`, `DB_PORT`, `DB_DATABASE`.
+- For LLMs, use `AZURE_OPENAI_API_KEY`, `AZURE_OPENAI_ENDPOINT`, `AZURE_OPENAI_DEPLOYMENT_NAME`.
+## Conventions and Workflows
+- Always use environment variables for secrets and config.
+- Always use `uv run` to run code and code tools.
+- Always use `pytest` for unit tests and run them with `uv run pytest`.
+- Always use `uv` and `uv add` to manage dependencies.
+## References
+- See `README.md` for high-level goals and links.
+## Security and Environment File Handling
+- **Never read, modify, index, or delete any `.env` files.**
+- Do not access, print, or manipulate environment variable files (e.g., `.env`) in any way.
+- All environment configuration is managed outside of AI agent operations for security and compliance.
+## Commit Message Guidelines (Conventional Commits)
+All commit messages should adhere to the [Conventional Commits specification](https://www.conventionalcommits.org/en/v1.0.0/). This provides a standardized format for commit messages, making it easier to understand the purpose of a commit and to automate changelog generation.
+The basic structure of a commit message is:
+```
+<type>[optional scope]: <description>
+[optional body]
+[optional footer(s)]
+```
+### Type
+The `type` is a mandatory prefix that indicates the kind of change introduced by the commit. Common types include:
+*   `feat`: A new feature
+*   `fix`: A bug fix
+*   `docs`: Documentation only changes
+*   `style`: Changes that do not affect the meaning of the code (white-space, formatting, missing semicolons, etc.)
+*   `refactor`: A code change that neither fixes a bug nor adds a feature
+*   `perf`: A code change that improves performance
+*   `test`: Adding missing tests or correcting existing tests
+*   `build`: Changes that affect the build system or external dependencies (example scopes: npm, gulp, broccoli, make)
+*   `ci`: Changes to our CI configuration files and scripts (example scopes: Travis, Circle, BrowserStack, SauceLabs)
+*   `chore`: Other changes that don't modify src or test files
+*   `revert`: Reverts a previous commit
+### Scope (Optional)
+The `scope` provides additional contextual information about the change. It is enclosed in parentheses after the `type`. For example, `feat(parser): add ability to parse arrays`.
+### Description
+The `description` is a concise, imperative, present-tense summary of the change. It should not be capitalized and should not end with a period.
+### Body (Optional)
+The `body` provides a longer, more detailed explanation of the commit's changes. It should be separated from the description by a blank line.
+### Footer(s) (Optional)
+The `footer` can contain information about breaking changes, references to issues, or other metadata. Breaking changes should start with `BREAKING CHANGE:` followed by a description.
+### Examples
+*   `feat: add new user authentication module`
+*   `fix(auth): correct password validation bug`
+*   `docs: update README with installation instructions`
+*   `refactor(api): simplify error handling logic`
+*   `refactor(core)!: remove old API endpoint`
+    `BREAKING CHANGE: The /api/v1/old-endpoint has been removed. Use /api/v1/new-endpoint instead.`

README.md CHANGED Viewed

@@ -9,7 +9,7 @@ This project leverages AI agents to automatically generate social media ad copy
 ## How it Works
-The system uses a Gradio interface (`app.py`) with two main tabs:
 1.  **Social Media Ad Generator:** This tab takes product URLs and other parameters as input. Behind the scenes, a "crew" of AI agents, each with a specific role, processes this information:
     *   **Product Analyst:** This agent scrapes a product URL to extract key information like the product name, features, price, and any available discounts. It also uses a tool to shorten the URL.
@@ -19,6 +19,12 @@ The system uses a Gradio interface (`app.py`) with two main tabs:
     *   **Expert Perfume Analyst and Web Data Extractor:** This agent extracts detailed perfume information (notes, accords, longevity, sillage, similar fragrances, reviews) from the Fragrantica page.
     *   **Fragrance Expert Woman and Perfume Analysis Reporter:** This agent synthesizes the extracted data into a human-friendly report, including graded evaluations and personalized recommendations.
 ## Setup and Usage
 1.  **Prerequisites:**
@@ -33,7 +39,7 @@ The system uses a Gradio interface (`app.py`) with two main tabs:
         ```
     *   Run the Docker container, mapping port 7860 and passing API keys as environment variables:
         ```bash
-        docker run -p 7860:7860 -e OPENAI_API_KEY="your_openai_api_key" -e NATURA_API_TOKEN="your_natura_api_token" -e OPENAI_BASE_URL="your_openai_base_url" -e OPENAI_MODEL_NAME="your_openai_model_name" natura-ads
         ```
     *   Access the Gradio interface in your web browser at `http://localhost:7860`.
@@ -42,6 +48,8 @@ The system uses a Gradio interface (`app.py`) with two main tabs:
 *   `app.py`: The Gradio application that provides the user interface.
 *   `social_media_crew.py`: Defines the AI agents and their tasks for social media ad generation.
 *   `fragrantica_crew.py`: Defines the AI agents and their tasks for Fragrantica website analysis.
 *   `stealth_scrape_tool.py`: A custom tool for stealthy web scraping using Playwright.
 *   `shortener_tool.py`: A custom tool for shortening URLs.
 *   `Dockerfile`: Defines the Docker image for deploying the application.
@@ -53,3 +61,6 @@ The system uses a Gradio interface (`app.py`) with two main tabs:
 - [x] Add support for any model/api key supported by LiteLLM.
 - [x] Add Fragrantica support, where user will input a Fragrantica URL and the agent will extract and generate a Perfume Analysis report.

 ## How it Works
+The system uses a Gradio interface (`app.py`) with three main tabs:
 1.  **Social Media Ad Generator:** This tab takes product URLs and other parameters as input. Behind the scenes, a "crew" of AI agents, each with a specific role, processes this information:
     *   **Product Analyst:** This agent scrapes a product URL to extract key information like the product name, features, price, and any available discounts. It also uses a tool to shorten the URL.
     *   **Expert Perfume Analyst and Web Data Extractor:** This agent extracts detailed perfume information (notes, accords, longevity, sillage, similar fragrances, reviews) from the Fragrantica page.
     *   **Fragrance Expert Woman and Perfume Analysis Reporter:** This agent synthesizes the extracted data into a human-friendly report, including graded evaluations and personalized recommendations.
+3.  **Image Ad Generator:** This tab allows users to generate a promotional image for a product. It takes the product name, original price, final price, a coupon code, and a product image URL as input. The tool then generates a promotional image with this information, based on a template.
+## Merchant Support
+The application now supports generating ad copy for both **Natura** and **Mercado Livre** products. The `merchs/merch.py` file defines a `Merchant` class with two subclasses: `NaturaMerchant` and `MercadoLivreMerchant`. This allows the application to use different templates and URL shorteners for each merchant.
 ## Setup and Usage
 1.  **Prerequisites:**
         ```
     *   Run the Docker container, mapping port 7860 and passing API keys as environment variables:
         ```bash
+        docker run --rm -p 7860:7860 -e OPENAI_API_KEY="your_openai_api_key" -e NATURA_API_TOKEN="your_natura_api_token" -e OPENAI_BASE_URL="your_openai_base_url" -e OPENAI_MODEL_NAME="your_openai_model_name" natura-ads
         ```
     *   Access the Gradio interface in your web browser at `http://localhost:7860`.
 *   `app.py`: The Gradio application that provides the user interface.
 *   `social_media_crew.py`: Defines the AI agents and their tasks for social media ad generation.
 *   `fragrantica_crew.py`: Defines the AI agents and their tasks for Fragrantica website analysis.
+*   `merchs/merch.py`: Defines the merchant-specific logic for Natura and Mercado Livre.
+*   `generate_image_tool.py`: A tool to generate promotional images for products.
 *   `stealth_scrape_tool.py`: A custom tool for stealthy web scraping using Playwright.
 *   `shortener_tool.py`: A custom tool for shortening URLs.
 *   `Dockerfile`: Defines the Docker image for deploying the application.
 - [x] Add support for any model/api key supported by LiteLLM.
 - [x] Add Fragrantica support, where user will input a Fragrantica URL and the agent will extract and generate a Perfume Analysis report.
+- [x] Support Mercado Livre Merchant
+- [wip] Add image templates
+- [ ] Create carousel images for Fragrantica posts

app.py CHANGED Viewed

@@ -2,95 +2,13 @@ import gradio as gr
 import os
 import requests
 from crewai import Agent, Task, Crew, Process, LLM
-from crewai_tools import ScrapeWebsiteTool
-from crewai.tools import BaseTool
 from dotenv import load_dotenv
 from stealth_scrape_tool import StealthScrapeTool
-load_dotenv()
-class ShortenerTool(BaseTool):
-    name: str = "URL Shortener Tool"
-    description: str = "Generates a short version of a given URL using an external API."
-    natura_api_token: str
-    def _run(self, original_url: str) -> str:
-        api_url = "https://sales-mgmt-cb-bff-apigw.prd.naturacloud.com/cb-bff-cms/cms/shortener"
-        headers = {"authorization": f"Bearer {self.natura_api_token}", "content-type": "application/json"}
-        payload = {"url": original_url}
-        try:
-            response = requests.post(api_url, headers=headers, json=payload)
-            response.raise_for_status()
-            short_url_data = response.json()
-            return short_url_data.get("short", original_url)
-        except requests.exceptions.RequestException as e:
-            print(f"Warning: Error generating short URL: {e}. Returning original URL.")
-            return original_url
-        except ValueError:
-            print("Warning: Invalid JSON response from shortener API. Returning original URL.")
-            return original_url
-class CalculateDiscountedPriceTool(BaseTool):
-    """
-    A tool to calculate the final price of an item after a discount is applied.
-    """
-    name: str = "Calculate Discounted Price Tool"
-    description: str = "Calculates the price after applying a given discount percentage."
-    def _run(self, original_price: float, discount_percentage: float) -> float:
-        """Calculates the discounted price and the total discount amount.
-        This method takes an original price and a discount percentage, validates
-        the inputs, and then computes the final price after the discount is
-        applied, as well as the amount saved.
-        Args:
-            original_price: The initial price of the item as a float or integer.
-        Returns:
-            float:
-                - The final discounted price, rounded to 2 decimal places.
-        """
-        if not isinstance(original_price, (int, float)) or not isinstance(discount_percentage, (int, float)):
-            raise ValueError("Both original_price and discount_percentage must be numbers.")
-        if discount_percentage < 0 or discount_percentage > 100:
-            raise ValueError("Discount percentage must be between 0 and 100.")
-        discount_amount = original_price * (discount_percentage / 100)
-        discounted_price = original_price - discount_amount
-        return round(discounted_price, 2)
-class CalculateDiscountValueTool(BaseTool):
-    """
-    A tool to calculate the final discount value of an item after comparing the original value and the final value.
-    """
-    name: str = "Calculate Discount Value Tool"
-    description: str = "Calculates the discount value after comparing two values."
-    def _run(self, original_price: float, final_price: float) -> float:
-        """Calculates the total discounted amount give the original and final price.
-        This method takes an original price and a final price, validates
-        the inputs, and then computes the final discounted value.
-        Args:
-            original_price: The initial price of the item as a float or integer.
-            final_price: The final price after discount as a float or integer.
-        Returns:
-            float:
-                - The final discount value, rounded to 0 decimal places.
-        """
-        if not isinstance(original_price, (int, float)) or not isinstance(final_price, (int, float)):
-            raise ValueError("Both original_price and final_price must be numbers.")
-        discount_value = original_price - final_price
-        discount_percentage = (discount_value / original_price) * 100
-        return round(discount_percentage, 0)
 class SocialMediaCrew:
     def __init__(self, openai_api_key: str, natura_api_token: str, openai_base_url: str, openai_model_name: str):
@@ -99,9 +17,10 @@ class SocialMediaCrew:
         self.openai_base_url = openai_base_url
         self.openai_model_name = openai_model_name
         self.scrape_tool = StealthScrapeTool() #ScrapeWebsiteTool()
-        self.shortener_tool = ShortenerTool(natura_api_token=self.natura_api_token)
         self.calculate_discounted_price_tool = CalculateDiscountedPriceTool()
         self.calculate_discount_value_tool = CalculateDiscountValueTool()
         print("Initializing SocialMediaCrew with BASE URL:", self.openai_base_url)
         print("Using OpenAI Model:", self.openai_model_name)
@@ -119,7 +38,6 @@ class SocialMediaCrew:
             backstory=("You are an expert in analyzing product pages and extracting the most important information. You can identify the product name, its main features, and the target audience."),
             verbose=True,
             tools=[self.scrape_tool,
-                   self.shortener_tool,
                    self.calculate_discounted_price_tool,
                    self.calculate_discount_value_tool],
             allow_delegation=False,
@@ -132,18 +50,19 @@ class SocialMediaCrew:
             goal='Create a compelling social media post in Portuguese to sell the product',
             backstory=("You are a creative copywriter specialized in the beauty and fragrance market. You know how to craft posts that are engaging, persuasive, and tailored for a Portuguese-speaking audience. You are an expert in using emojis and hashtags to increase engagement."),
             verbose=True,
             allow_delegation=False,
             llm=llm,
             max_retries=3
         )
-    def run_crew(self, product_url: str, main_cupom: str, main_cupom_discount_percentage: float, cupom_1: str, cupom_2: str) -> str:
         headers = {
             "accept": "*/*",
             "accept-language": "pt-BR,pt;q=0.9,en-US;q=0.8,en;q=0.7",
-            "sec-ch-ua": '"Not)A;Brand";v="8", "Chromium";v="138", "Google Chrome";v="138"' ,
             "sec-ch-ua-mobile": "?0",
-            "sec-ch-ua-platform": '"Windows"' ,
             "sec-fetch-dest": "empty",
             "sec-fetch-mode": "cors",
             "sec-fetch-site": "cross-site",
@@ -153,48 +72,58 @@ class SocialMediaCrew:
             response = requests.get(product_url, headers=headers)
             response.raise_for_status()
             if '<template data-dgst="NEXT_NOT_FOUND">' in response.text:
-                return "INVALID_URL"
         except requests.exceptions.RequestException as e:
             print(f"Error checking URL: {e}")
-            return "INVALID_URL"
-        analyze_product_task = Task(
-            description=(f"1. Scrape the content of the URL: {product_url} using the 'scrape_tool' with css_element = '.product-detail-banner'.\n2. Identify and extract the original product price and the final discounted price if existing. IGNORE any price breakdowns like 'produto' or 'consultoria'.\n3. Extract the product name, key characteristics, and any other relevant DISCOUNT available.\n4. Use the 'Calculate Discounted Price Tool' with the extracted final best price and the provided DISCOUNT PERCENTAGE ({main_cupom_discount_percentage}) to get the CUPOM DISCOUNTED PRICE.\n4.1 Use the 'Calculate Discount Value Tool' with ORIGINAL PRICE and CUPOM DISCOUNTED PRICE to get the TOTAL DISCOUNT PERCENTAGE.\n5. Use the 'URL Shortener Tool' to generate a short URL for {product_url}. If the shortener tool returns an error, use the original URL.\n6. Provide all this information, including the product name, ORIGINAL PRICE, DISCOUNTED PRICE  (the one used as the input in the tool 'Calculate Discounted Price Tool'), 2) CUPOM DISCOUNTED PRICE, and the generated short URL (or the original if the shortener failed). If any of this information cannot be extracted, you MUST return 'MISSING_PRODUCT_INFO'."),
             agent=self.product_analyst,
-            expected_output="A concise summary of the product including its name, key features, unique selling points, ORIGINAL PRICE, DISCOUNTED PRICE (the one used as the input in the tool 'Calculate Discounted Price Tool'), CUPOM DISCOUNTED PRICE, TOTAL DISCOUNT PERCENTAGE, and the SHORT SHAREABLE URL (or the original if the shortener failed), OR 'MISSING_PRODUCT_INFO' if essential product details are not found."
         )
-        create_post_task = Task(
-            description=(f"""Based on the product analysis, create a CONCISE and DIRECT social media post in Portuguese, suitable for a WhatsApp group.
- If the input you receive is 'INVALID_URL' or 'MISSING_PRODUCT_INFO', you MUST stop and output only that same message.
- The post should strictly follow this template:
- ###Template:
-{{Title}}
-{{Description}}
-De ~~{{ORIGINAL PRICE}}~~
-🔥Por {{CUPOM DISCOUNTED PRICE}} 🔥
-🔥 {{TOTAL DISCOUNT PERCENTAGE}}% OFF!
-🎟️ USE O CUPOM >>> {main_cupom}
-🛒 Link >>> {{short_url}}
-`🎟️ *Cupom válido para a primeira compra no link Minha Loja Natura, mesmo se já comprou no app ou link antigo. Demais compras ou app, use o cupom {cupom_1} ou {cupom_2} (o desconto é um pouco menor)`
-`‼️ Faça login nesse link com o mesmo email e senha que já usa pra comprar Natura!`
-###End Template
-Ensure a URL is always present in the output. Include a clear call to action and a MAXIMUM of 2 relevant emojis. DO NOT include hashtags. Keep it short and impactful and does not forget to include the backticks around the last paragraph.
- If the input you receive is 'INVALID_URL', you MUST stop and output only 'INVALID_URL'."""),
             agent=self.social_media_copywriter,
             expected_output="A short, direct, and impactful social media post in Portuguese for WhatsApp, strictly following the provided template, including the FINAL PRICE, any DISCOUNT, the SHORT SHAREABLE URL, a call to action, and up to 2 emojis, one in the Title and another in the Description. No hashtags should be present. A URL must always be present in the final output, OR the message 'INVALID_URL' or 'MISSING_PRODUCT_INFO' if the page was not found or product info is missing.",
             context=[analyze_product_task]
         )
         crew = Crew(
             agents=[self.product_analyst, self.social_media_copywriter],
             tasks=[analyze_product_task, create_post_task],
@@ -212,19 +141,25 @@ def clean_env_vars():
     os.environ.pop("OPENAI_MODEL_NAME", None)
 # --- Gradio Interface ---
-def generate_ad(product_url: str, main_cupom: str, main_cupom_discount_percentage: float, cupom_1: str, cupom_2: str, openai_api_key: str, natura_api_token: str, openai_base_url: str, openai_model_name: str):
     if not openai_api_key or not natura_api_token or not openai_model_name or not openai_base_url:
-        return "Please configure your API keys in the settings section below."
     social_media_crew = SocialMediaCrew(openai_api_key, natura_api_token, openai_base_url, openai_model_name)
-    result = social_media_crew.run_crew(product_url, main_cupom, main_cupom_discount_percentage, cupom_1, cupom_2)
     if result == "INVALID_URL":
-        return "❌ The provided URL is invalid or the product page could not be found."
     elif result == "MISSING_PRODUCT_INFO":
-        return "⚠️ Could not extract all required product information from the URL. Please check the URL or try a different one."
     else:
-        return result.raw
 with gr.Blocks() as demo:
     gr.Markdown("# 🚀 Social Media Ad Generator")
@@ -232,12 +167,16 @@ with gr.Blocks() as demo:
     with gr.Tab("Generate Ad"):
         url_input = gr.Textbox(label="Product URL", placeholder="Enter product URL here...")
         main_cupom_input = gr.Textbox(label="Main Cupom (e.g., PRIMEIRACOMPRA)", value="PRIMEIRACOMPRA")
-        main_cupom_discount_percentage_input = gr.Number(label="Main Cupom Discount Percentage (e.g., 20 for 20%)", value=20, minimum=0, maximum=100)
         cupom_1_input = gr.Textbox(label="Cupom 1 (e.g., AMIGO15)", placeholder="Enter first coupon code...")
-        cupom_2_input = gr.Textbox(label="Cupom 2 (e.g., JULHOA)", placeholder="Enter second coupon code...")
-        generate_button = gr.Button("Generate Ad")
         ad_output = gr.Markdown(label="Your Generated Ad", show_copy_button=True)
     with gr.Tab("Fragrantica"):
@@ -258,8 +197,12 @@ with gr.Blocks() as demo:
         # No save button needed as keys are passed directly
         gr.Markdown("API keys are used directly from these fields when you click 'Generate Ad'. They are not saved persistently.")
-    generate_button.click(generate_ad, inputs=[url_input, main_cupom_input, main_cupom_discount_percentage_input, cupom_1_input, cupom_2_input, openai_key_input, natura_token_input, openai_base_url_input, openai_model_name_input], outputs=ad_output)
     # Placeholder for Fragrantica analysis function
     def analyze_fragrantica_url(url, openai_api_key, natura_api_token, openai_base_url, openai_model_name):
         if not openai_api_key or not openai_model_name or not openai_base_url:

 import os
 import requests
 from crewai import Agent, Task, Crew, Process, LLM
 from dotenv import load_dotenv
 from stealth_scrape_tool import StealthScrapeTool
+from image_generator_tool import GenerateImageTool
+from utils_tools import CalculateDiscountedPriceTool, CalculateDiscountValueTool, GetImageUrlTool, MerchantSelectorTool
+load_dotenv()
 class SocialMediaCrew:
     def __init__(self, openai_api_key: str, natura_api_token: str, openai_base_url: str, openai_model_name: str):
         self.openai_base_url = openai_base_url
         self.openai_model_name = openai_model_name
         self.scrape_tool = StealthScrapeTool() #ScrapeWebsiteTool()
         self.calculate_discounted_price_tool = CalculateDiscountedPriceTool()
         self.calculate_discount_value_tool = CalculateDiscountValueTool()
+        self.image_generator_tool = GenerateImageTool()
+        self.merchant_selector_tool = MerchantSelectorTool(natura_api_token=self.natura_api_token)
         print("Initializing SocialMediaCrew with BASE URL:", self.openai_base_url)
         print("Using OpenAI Model:", self.openai_model_name)
             backstory=("You are an expert in analyzing product pages and extracting the most important information. You can identify the product name, its main features, and the target audience."),
             verbose=True,
             tools=[self.scrape_tool,
                    self.calculate_discounted_price_tool,
                    self.calculate_discount_value_tool],
             allow_delegation=False,
             goal='Create a compelling social media post in Portuguese to sell the product',
             backstory=("You are a creative copywriter specialized in the beauty and fragrance market. You know how to craft posts that are engaging, persuasive, and tailored for a Portuguese-speaking audience. You are an expert in using emojis and hashtags to increase engagement."),
             verbose=True,
+            tools=[self.image_generator_tool],
             allow_delegation=False,
             llm=llm,
             max_retries=3
         )
+    def _validate_url(self, product_url: str) -> bool:
         headers = {
             "accept": "*/*",
             "accept-language": "pt-BR,pt;q=0.9,en-US;q=0.8,en;q=0.7",
+            "sec-ch-ua": '"Not)A;Brand";v="8", "Chromium";v="138", "Google Chrome";v="138"',
             "sec-ch-ua-mobile": "?0",
+            "sec-ch-ua-platform": '"Windows"',
             "sec-fetch-dest": "empty",
             "sec-fetch-mode": "cors",
             "sec-fetch-site": "cross-site",
             response = requests.get(product_url, headers=headers)
             response.raise_for_status()
             if '<template data-dgst="NEXT_NOT_FOUND">' in response.text:
+                return False
+            return True
         except requests.exceptions.RequestException as e:
             print(f"Error checking URL: {e}")
+            return False
+    def _prepare_merchant(self, product_url: str):
+        """Resolve the merchant for ``product_url`` and derive its scraping inputs.
+
+        Returns a ``(merchant, css_selector, short_url)`` tuple: the object
+        returned by the merchant selector tool, the CSS selector that merchant
+        reports, and the result of the merchant's ``shorten_url`` for the URL.
+        """
+        merchant = self.merchant_selector_tool.run(product_url)
+        css_selector = merchant.get_css_selector()
+        short_url = merchant.shorten_url(product_url)
+        return merchant, css_selector, short_url
+    def _create_analyze_product_task(self, product_url: str, css_selector: str, main_cupom_discount_percentage: float, short_url: str, original_price: float, discounted_price: float) -> Task:
+        task_description = (f"1. Scrape the content of the URL: {product_url} using the 'scrape_tool' with css_element = '{css_selector}'.\n"
+                            "2. Extract the product name, key characteristics, and any other relevant DISCOUNT available.\n")
+        if original_price is not None and original_price > 0 and discounted_price is not None and discounted_price > 0:
+            task_description += (f"3. The user has provided the prices. Use ORIGINAL PRICE = {original_price} and DISCOUNTED PRICE = {discounted_price}.\n")
+            final_best_price_source = str(discounted_price)
+        else:
+            task_description += ("3. Identify and extract the original product price and the final discounted price if existing from the scraped content. "
+                                 "IGNORE any price breakdowns like 'produto' or 'consultoria'.\n")
+            final_best_price_source = "the extracted final best price"
+        task_description += (f"4. Use the 'Calculate Discounted Price Tool' with {final_best_price_source} and the provided DISCOUNT PERCENTAGE ({main_cupom_discount_percentage}) to get the CUPOM DISCOUNTED PRICE.\n"
+                             "4.1 Use the 'Calculate Discount Value Tool' with ORIGINAL PRICE and CUPOM DISCOUNTED PRICE to get the TOTAL DISCOUNT PERCENTAGE.\n"
+                             f"5. Provide all this information, including the product name, ORIGINAL PRICE, DISCOUNTED PRICE (the one from step 3), CUPOM DISCOUNTED PRICE, and the generated short URL ({short_url}). If any of this information cannot be extracted, you MUST return 'MISSING_PRODUCT_INFO'.")
+        return Task(
+            description=task_description,
             agent=self.product_analyst,
+            expected_output="A concise summary of the product including its name, key features, unique selling points, ORIGINAL PRICE, DISCOUNTED PRICE (the one used as the input in the tool 'Calculate Discounted Price Tool'), CUPOM DISCOUNTED PRICE, TOTAL DISCOUNT PERCENTAGE, and the SHORT SHAREABLE URL ({short_url}), OR 'MISSING_PRODUCT_INFO' if essential product details are not found."
         )
+    def _create_post_task(self, analyze_product_task: Task, merchant, main_cupom: str, cupom_1: str, store_name: str) -> Task:
+        """Build the copywriting Task that turns the product analysis into a post.
+
+        The post template comes from ``merchant.get_template(main_cupom, cupom_1,
+        store=store_name)`` and is embedded in the prompt; ``analyze_product_task``
+        is attached as the task's context.
+        """
+        template = merchant.get_template(main_cupom, cupom_1, store=store_name)
+        return Task(
+            description=(f"Based on the product analysis, create a CONCISE and DIRECT social media post in Portuguese, suitable for a WhatsApp group. \n If the input you receive is 'INVALID_URL' or 'MISSING_PRODUCT_INFO', you MUST stop and output only that same message.\n The post should strictly follow this template:\n {template}\n\nEnsure a URL is always present in the output. Include a clear call to action and a MAXIMUM of 2 relevant emojis. DO NOT include hashtags. Keep it short and impactful and does not forget to include the backticks around the last paragraph.\n\n If the input you receive is 'INVALID_URL', you MUST stop and output only 'INVALID_URL'."),
             agent=self.social_media_copywriter,
             expected_output="A short, direct, and impactful social media post in Portuguese for WhatsApp, strictly following the provided template, including the FINAL PRICE, any DISCOUNT, the SHORT SHAREABLE URL, a call to action, and up to 2 emojis, one in the Title and another in the Description. No hashtags should be present. A URL must always be present in the final output, OR the message 'INVALID_URL' or 'MISSING_PRODUCT_INFO' if the page was not found or product info is missing.",
             context=[analyze_product_task]
         )
+    def run_crew(self, product_url: str, store_name: str, main_cupom: str, main_cupom_discount_percentage: float, cupom_1: str, original_price: float, discounted_price: float) -> str:
+        if not self._validate_url(product_url):
+            return "INVALID_URL"
+        merchant, css_selector, short_url = self._prepare_merchant(product_url)
+        analyze_product_task = self._create_analyze_product_task(product_url, css_selector, main_cupom_discount_percentage, short_url, original_price, discounted_price)
+        create_post_task = self._create_post_task(analyze_product_task, merchant, main_cupom, cupom_1, store_name)
         crew = Crew(
             agents=[self.product_analyst, self.social_media_copywriter],
             tasks=[analyze_product_task, create_post_task],
     os.environ.pop("OPENAI_MODEL_NAME", None)
 # --- Gradio Interface ---
+def generate_ad(product_url: str, store_name: str, main_cupom: str, main_cupom_discount_percentage: float, cupom_1: str, original_price: float, discounted_price: float, openai_api_key: str, natura_api_token: str, openai_base_url: str, openai_model_name: str):
+    yield gr.update(interactive=False, value="Generating..."), gr.Markdown(value="⏳ Generating ad... Please wait.")
     if not openai_api_key or not natura_api_token or not openai_model_name or not openai_base_url:
+        yield gr.update(interactive=True, value="Generate Ad"), gr.Markdown(value="Please configure your API keys in the settings section below.")
+        return
+    original_price = original_price if original_price is not None else 0
+    discounted_price = discounted_price if discounted_price is not None else 0
     social_media_crew = SocialMediaCrew(openai_api_key, natura_api_token, openai_base_url, openai_model_name)
+    result = social_media_crew.run_crew(product_url, store_name, main_cupom, main_cupom_discount_percentage, cupom_1, original_price, discounted_price)
     if result == "INVALID_URL":
+        yield gr.update(interactive=True, value="Generate Ad"), gr.Markdown(value="❌ The provided URL is invalid or the product page could not be found.")
     elif result == "MISSING_PRODUCT_INFO":
+        yield gr.update(interactive=True, value="Generate Ad"), gr.Markdown(value="⚠️ Could not extract all required product information from the URL. Please check the URL or try a different one.")
     else:
+        yield gr.update(interactive=True, value="Generate Ad"), gr.Markdown(value=result.raw)
 with gr.Blocks() as demo:
     gr.Markdown("# 🚀 Social Media Ad Generator")
     with gr.Tab("Generate Ad"):
         url_input = gr.Textbox(label="Product URL", placeholder="Enter product URL here...")
+        store_name_input = gr.Textbox(label="Store Name (e.g., O Boticário)", placeholder="Enter store name...")
         main_cupom_input = gr.Textbox(label="Main Cupom (e.g., PRIMEIRACOMPRA)", value="PRIMEIRACOMPRA")
+        main_cupom_discount_percentage_input = gr.Number(label="Main Cupom Discount Percentage (e.g., 20 for 20%)", value=15, minimum=0, maximum=100)
         cupom_1_input = gr.Textbox(label="Cupom 1 (e.g., AMIGO15)", placeholder="Enter first coupon code...")
+        original_price_input = gr.Number(label="Original Price (Optional)", value=0, minimum=0)
+        discounted_price_input = gr.Number(label="Discounted Price (Optional)", value=0, minimum=0)
+        with gr.Row():
+            generate_button = gr.Button("Generate Ad")
+            clear_button = gr.Button("Clear")
         ad_output = gr.Markdown(label="Your Generated Ad", show_copy_button=True)
     with gr.Tab("Fragrantica"):
         # No save button needed as keys are passed directly
         gr.Markdown("API keys are used directly from these fields when you click 'Generate Ad'. They are not saved persistently.")
+    def clear_fields():
+        """Return the reset values ("", 0, 0) for the three outputs of the Clear button."""
+        return "", 0, 0
+    generate_button.click(generate_ad, inputs=[url_input, store_name_input, main_cupom_input, main_cupom_discount_percentage_input, cupom_1_input, original_price_input, discounted_price_input, openai_key_input, natura_token_input, openai_base_url_input, openai_model_name_input], outputs=[generate_button, ad_output])
+    clear_button.click(clear_fields, inputs=[], outputs=[url_input, original_price_input, discounted_price_input])
     # Placeholder for Fragrantica analysis function
     def analyze_fragrantica_url(url, openai_api_key, natura_api_token, openai_base_url, openai_model_name):
         if not openai_api_key or not openai_model_name or not openai_base_url:

assets/Montserrat-Bold.ttf ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:846d5823e5c909a5aad49efbd71dd5f3320a8640fff86840bf7d529c8d8660a5
+size 335788

assets/Montserrat-Regular.ttf ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f5a3f02c4a72f1da11c6dadf4fd78c07b2f145a34ed46eb875ed0da28cbd348c
+size 330948

assets/template_natura_empty.jpg ADDED Viewed

Git LFS Details

SHA256: 43b40b4ee2cfc678845fceecec9f1f2610ed25685d937dd5c5c52ea9eeac77c1
Pointer size: 131 Bytes
Size of remote file: 235 kB

generate_image_tool.py ADDED Viewed

	@@ -0,0 +1,101 @@

+import requests
+from PIL import Image, ImageDraw, ImageFont
+from io import BytesIO
+import uuid
+# --- 1. SETUP: Define your data ---
+# Input and Output files
+template_path = 'template_natura_empty.jpg'
+output_path = f'{uuid.uuid4()}.png'
+# Image to place on the template
+# NOTE: Replace this with parameters
+product_image_url = 'https://production.na01.natura.com/on/demandware.static/-/Sites-natura-br-storefront-catalog/default/dw68595724/NATBRA-89834_1.jpg'
+product_name = "Homem Cor.agio"
+original_price = "De: R$ 399,00"
+final_price = "Por: R$ 167,92"
+coupon_code = "AGOSTOA"
+# --- 2. IMAGE PROCESSING ---
+try:
+    # Load the base template image
+    template_image = Image.open(template_path).convert("RGBA")
+    # Fetch the product image from the URL
+    response = requests.get(product_image_url)
+    product_image_data = BytesIO(response.content)
+    product_image = Image.open(product_image_data).convert("RGBA")
+    # Define the position and size for the product image placeholder
+    # These coordinates were estimated from your template (width, height)
+    box_size = (442, 353)
+    box_position = (140, 280) # (x, y) from top-left corner
+    # --- KEY CHANGE 1: Resize image while preserving aspect ratio ---
+    # The thumbnail method resizes the image to fit within the box_size
+    # without changing its aspect ratio. It modifies the image in-place.
+    product_image_resized = product_image.copy() # Work on a copy
+    product_image_resized.thumbnail(box_size)
+    # --- KEY CHANGE 2: Calculate position to center the image ---
+    # Find the top-left corner to paste the image so it's centered in the box
+    paste_x = box_position[0] + (box_size[0] - product_image_resized.width) // 2
+    paste_y = box_position[1] + (box_size[1] - product_image_resized.height) // 2
+    paste_position = (paste_x, paste_y)
+    # Paste the resized product image onto the template
+    template_image.paste(product_image_resized, paste_position, product_image_resized)
+    # --- 3. TEXT DRAWING ---
+    # Create a drawing context
+    draw = ImageDraw.Draw(template_image)
+    # Define fonts. For best results, download a font like 'Montserrat' and provide the path.
+    # Using a default font if a specific one isn't found.
+    try:
+        font_name = ImageFont.truetype("Montserrat-Bold.ttf", 47)
+        font_price_from = ImageFont.truetype("Montserrat-Regular.ttf", 28)
+        font_price = ImageFont.truetype("Montserrat-Bold.ttf", 47)
+        font_cupom = ImageFont.truetype("Montserrat-Bold.ttf", 33)
+    except IOError:
+        print("Arial font not found. Using default font.")
+        font_bold = ImageFont.load_default()
+        font_regular = ImageFont.load_default()
+        font_price = ImageFont.load_default()
+        font_cupom = ImageFont.load_default()
+    # Define text colors
+    white_color = "#FFFFFF"
+    yellow_color = "#FEE161" # A yellow sampled from your design
+    black_color = "#000000"
+    # Add text to the image
+    # The 'anchor="ms"' centers the text horizontally at the given x-coordinate
+    # 1. Product Name
+    draw.text((360, 710), product_name, font=font_name, fill=white_color, anchor="ms")
+    # 2. Original Price
+    draw.text((360, 800), original_price, font=font_price_from, fill=white_color, anchor="ms")
+    # 3. Final Price
+    draw.text((360, 860), final_price, font=font_price, fill=yellow_color, anchor="ms")
+    # 4. Coupon Code
+    draw.text((360, 993), coupon_code, font=font_cupom, fill=black_color, anchor="ms")
+    # --- 4. SAVE THE FINAL IMAGE ---
+    # Save the result as a PNG to preserve quality
+    template_image.save(output_path)
+    print(f"✨ Success! Image saved as '{output_path}'")
+except FileNotFoundError:
+    print(f"Error: The template file '{template_path}' was not found.")
+except Exception as e:
+    print(f"An error occurred: {e}")

image_generator_tool.py ADDED Viewed

	@@ -0,0 +1,78 @@

+from crewai.tools import BaseTool
+from pydantic import BaseModel, Field
+from PIL import Image, ImageDraw, ImageFont
+import requests
+from io import BytesIO
+import uuid
+class GenerateImageToolInput(BaseModel):
+    """Input for the Generate Image Tool."""
+    # Every field is declared with Field(...), i.e. no default value is provided.
+    # Prices are strings and are drawn on the image exactly as given.
+    product_image_url: str = Field(..., description="URL of the product image to be placed on the template.")
+    product_name: str = Field(..., description="Name of the product.")
+    original_price: str = Field(..., description="Original price of the product.")
+    final_price: str = Field(..., description="Final price of the product.")
+    coupon_code: str = Field(..., description="Coupon code to be displayed on the image.")
+import tempfile
+import os
+class GenerateImageTool(BaseTool):
+    name: str = "Generate Image Tool"
+    description: str = "Generates a promotional image for a product using a template."
+    args_schema = GenerateImageToolInput
+    def _run(self, product_image_url: str, product_name: str, original_price: str, final_price: str, coupon_code: str) -> str:
+        template_path = 'assets/template_natura_empty.jpg'
+        temp_dir = tempfile.gettempdir()
+        output_path = os.path.join(temp_dir, f'{uuid.uuid4()}.png')
+        try:
+            template_image = Image.open(template_path).convert("RGBA")
+            response = requests.get(product_image_url)
+            product_image_data = BytesIO(response.content)
+            product_image = Image.open(product_image_data).convert("RGBA")
+            box_size = (442, 353)
+            box_position = (140, 280)
+            product_image_resized = product_image.copy()
+            product_image_resized.thumbnail(box_size)
+            paste_x = box_position[0] + (box_size[0] - product_image_resized.width) // 2
+            paste_y = box_position[1] + (box_size[1] - product_image_resized.height) // 2
+            paste_position = (paste_x, paste_y)
+            template_image.paste(product_image_resized, paste_position, product_image_resized)
+            draw = ImageDraw.Draw(template_image)
+            try:
+                font_name = ImageFont.truetype("assets/Montserrat-Bold.ttf", 47)
+                font_price_from = ImageFont.truetype("assets/Montserrat-Regular.ttf", 28)
+                font_price = ImageFont.truetype("assets/Montserrat-Bold.ttf", 47)
+                font_cupom = ImageFont.truetype("assets/Montserrat-Bold.ttf", 33)
+            except IOError:
+                print("Arial font not found. Using default font.")
+                font_name = ImageFont.load_default()
+                font_price_from = ImageFont.load_default()
+                font_price = ImageFont.load_default()
+                font_cupom = ImageFont.load_default()
+            white_color = "#FFFFFF"
+            yellow_color = "#FEE161"
+            black_color = "#000000"
+            draw.text((360, 710), product_name, font=font_name, fill=white_color, anchor="ms")
+            draw.text((360, 800), original_price, font=font_price_from, fill=white_color, anchor="ms")
+            draw.text((360, 860), final_price, font=font_price, fill=yellow_color, anchor="ms")
+            draw.text((360, 993), coupon_code, font=font_cupom, fill=black_color, anchor="ms")
+            template_image.save(output_path)
+            return output_path
+        except FileNotFoundError:
+            return f"Error: The template file '{template_path}' was not found."
+        except Exception as e:
+            return f"An error occurred: {e}"

main.py ADDED Viewed

	@@ -0,0 +1,66 @@

+import os
+import csv
+from dotenv import load_dotenv
+from social_media_crew import SocialMediaCrew
+import mlflow
+# Batch script: reads product URLs from a CSV file, runs the crew once per URL
+# and writes every generated ad to a single Markdown file.
+# MLflow autologging for CrewAI is switched on as soon as this module is loaded.
+mlflow.crewai.autolog()
+# Optional: Set a tracking URI and an experiment name if you have a tracking server
+mlflow.set_tracking_uri("http://localhost:5000")
+mlflow.set_experiment("CrewAI")
+# Load environment variables from .env file
+load_dotenv()
+# Now you can safely access the API key
+# Make sure your .env file has OPENAI_API_KEY="your_key_here"
+# NOTE(review): both values are only checked for presence here; this script
+# never passes them to SocialMediaCrew.
+api_key = os.getenv("OPENAI_API_KEY")
+natura_api_token = os.getenv("NATURA_API_TOKEN")
+if not api_key:
+    raise ValueError("OPENAI_API_KEY not found in .env file or environment variables.")
+if not natura_api_token:
+    raise ValueError("NATURA_API_TOKEN not found in .env file or environment variables. Please set it for the URL shortener tool.")
+CSV_FILE = 'urls.csv'
+MARKDOWN_FILE = 'social_media_ads.md'
+all_results = []
+# Initialize the SocialMediaCrew
+# NOTE(review): the crew is built with no arguments and run_crew() below receives
+# only the URL; confirm this matches the current SocialMediaCrew signature.
+social_media_crew = SocialMediaCrew()
+try:
+    with open(CSV_FILE, mode='r', encoding='utf-8') as file:
+        reader = csv.DictReader(file)
+        for row in reader:
+            # A missing 'url' column raises KeyError, handled at the bottom.
+            current_url = row['url']
+            # Run the crew for the current URL
+            result = social_media_crew.run_crew(current_url)
+            print("######################")
+            print("Crew work finished for URL:", current_url)
+            print("Final result:")
+            print(result)
+            print("######################\n")
+            all_results.append({'url': current_url, 'ad': result})
+    # Write all results to a Markdown file
+    with open(MARKDOWN_FILE, mode='w', encoding='utf-8') as md_file:
+        md_file.write("# Social Media Ads for Perfumes\n\n")
+        for item in all_results:
+            md_file.write(f"## URL: {item['url']}\n\n")
+            md_file.write(f"{item['ad']}\n\n---\n\n")
+    print(f"All social media ads have been written to '{MARKDOWN_FILE}'")
+except FileNotFoundError:
+    print(f"Error: The CSV file '{CSV_FILE}' was not found. Please create it with a 'url' column.")
+except KeyError:
+    print(f"Error: The CSV file '{CSV_FILE}' must contain a 'url' column.")
+except Exception as e:
+    print(f"An unexpected error occurred: {e}")

merchs/merch.py ADDED Viewed

	@@ -0,0 +1,73 @@

+from abc import ABC, abstractmethod
+from shortener_tool import ShortenerTool
+class Merchant():
+    def __init__(self):
+        pass
+    @abstractmethod
+    def get_template(self, main_cupom, cupom_1, store = None) -> str:
+        pass
+    def get_css_selector(self) -> str:
+        return "body"
+    @abstractmethod
+    def shorten_url(self, url: str) -> str:
+        pass
+class NaturaMerchant(Merchant):
+    """Merchant implementation for Natura product pages."""
+    def __init__(self, natura_api_token: str):
+        super().__init__()
+        # NOTE(review): natura_api_token is accepted but not used or stored here;
+        # confirm how ShortenerTool obtains its credentials.
+        self.shortener_tool = ShortenerTool()
+    def get_template(self, main_cupom, cupom_1, store = None) -> str:
+        """Return the Natura post template; ``store`` is not used by this merchant."""
+        # Doubled braces become literal {placeholders} in the returned text; only the
+        # coupon codes are interpolated here. The "ou <cupom_1>" part is added only
+        # when cupom_1 is truthy.
+        return f"""
+###Template:
+{{Title}}
+{{Description}}
+Preço original: ~~{{ORIGINAL PRICE}}~~
+**HOJE: {{CUPOM DISCOUNTED PRICE}} — {{TOTAL DISCOUNT PERCENTAGE}}% OFF**
+🎟️ CUPOM: {main_cupom} {'ou ' + cupom_1 if cupom_1 else ''}
+🛒 Compre aqui: {{short_url}}
+`⚠️ Faça login com o mesmo email e senha que já usa para comprar na Natura!`
+###End Template
+    """
+    def get_css_selector(self) -> str:
+        """Return the selector of the Natura product banner element."""
+        return ".product-detail-banner"
+    def shorten_url(self, url: str) -> str:
+        """Return the result of running the shortener tool on ``url``."""
+        return self.shortener_tool.run(url)
+class MercadoLivreMerchant(Merchant):
+    def get_template(self, main_cupom, cupom_1, store = None) -> str:
+        return f"""
+###Template:
+{{Title}}
+(MERCADO LIVRE - {store.upper()} OFICIAL)
+{{Description}}
+Preço original: ~~{{ORIGINAL PRICE}}~~
+**HOJE: {{CUPOM DISCOUNTED PRICE}} — {{TOTAL DISCOUNT PERCENTAGE}}% OFF**
+🎟️ CUPOM: {main_cupom}
+🛒 Compre aqui: {{short_url}}
+`⚠️ Selecione a loja oficial {store.upper()}`
+###End Template
+   """
+    def get_css_selector(self) -> str:
+        return ".rl-card-featured"
+    def shorten_url(self, url: str) -> str:
+        return url

pyproject.toml CHANGED Viewed

@@ -10,6 +10,19 @@ dependencies = [
     "crewai-tools>=0.55.0",
     "gradio>=5.38.0",
     "litellm>=1.72.6",
     "playwright>=1.53.0",
     "playwright-stealth>=2.0.0",
 ]

     "crewai-tools>=0.55.0",
     "gradio>=5.38.0",
     "litellm>=1.72.6",
+    "pillow>=11.3.0",
     "playwright>=1.53.0",
     "playwright-stealth>=2.0.0",
+    "requests>=2.32.4",
 ]
+[dependency-groups]
+dev = [
+    "pytest>=8.4.1",
+]
+[tool.pytest.ini_options]
+pythonpath = [
+    ".",
+]
+testpaths = ["tests"]

scrape.py ADDED Viewed

	@@ -0,0 +1,46 @@

+import asyncio
+from playwright.async_api import async_playwright
+from playwright_stealth.stealth import Stealth
+from bs4 import BeautifulSoup
+async def main():
+    """Load a hard-coded Fragrantica page with stealth Playwright and print one div.
+
+    Saves 'success_screenshot.png' once the main heading is visible, or
+    'error_screenshot.png' if anything in the flow raises.
+    """
+    url = "https://www.fragrantica.com.br/perfume/Natura/Frescor-de-Cacau-25963.html"
+    async with Stealth().use_async(async_playwright()) as p:
+        browser = await p.chromium.launch(headless=True)
+        # Create the page from the stealthy context
+        page = await browser.new_page()
+        try:
+            print("Navigating to page with corrected stealth logic...")
+            await page.goto(url, timeout=120000)
+            print("Waiting for Cloudflare check/content load...")
+            # The product heading is used as the signal that real content has loaded.
+            main_content_selector = 'h1[itemprop="name"]'
+            await page.wait_for_selector(main_content_selector, timeout=60000)
+            print("✅ Cloudflare passed! Main content is visible.")
+            await page.screenshot(path='success_screenshot.png')
+            html_content = await page.content()
+            soup = BeautifulSoup(html_content, 'html.parser')
+            # Only the first matching div is printed.
+            target_div = soup.find('div', class_='grid-x grid-margin-x')
+            if target_div:
+                div_string = target_div.prettify()
+                print("\n--- Targeted Div HTML Content ---")
+                print(div_string)
+            else:
+                print("❌ Could not find the <div class=\"grid-x grid-margin-x\"> tag.")
+        except Exception as e:
+            print(f"An error occurred: {e}")
+            await page.screenshot(path='error_screenshot.png')
+            print("Saved 'error_screenshot.png' for debugging.")
+        finally:
+            # Always close the browser, whether the scrape succeeded or failed.
+            await browser.close()
+            print("\nBrowser closed.")
+if __name__ == "__main__":
+    asyncio.run(main())

stealth_scrape_tool.py CHANGED Viewed

@@ -16,8 +16,16 @@ class StealthScrapeTool(BaseTool):
                 await page.goto(website_url, timeout=120000)
-                # Wait for the specific element to be present
-                await page.wait_for_selector(css_element, timeout=60000)
                 html_content = await page.content()
                 soup = BeautifulSoup(html_content, 'html.parser')

                 await page.goto(website_url, timeout=120000)
+                try:
+                    # Wait for the specific element to be present
+                    await page.wait_for_selector(css_element, timeout=30000)
+                except Exception as e:
+                    # If timeout error, try again with "body" as css_element
+                    if "Timeout" in str(e) and css_element != "body":
+                        await page.wait_for_selector("body", timeout=60000)
+                        css_element = "body"
+                    else:
+                        raise e
                 html_content = await page.content()
                 soup = BeautifulSoup(html_content, 'html.parser')

test_tool.py ADDED Viewed

	@@ -0,0 +1,13 @@

+from image_generator_tool import GenerateImageTool
+# Manual smoke check: calls GenerateImageTool._run directly with sample data and
+# prints whatever it returns (an output path or an error string).
+tool = GenerateImageTool()
+result = tool._run(
+    product_image_url='https://production.na01.natura.com/on/demandware.static/-/Sites-natura-br-storefront-catalog/default/dw68595724/NATBRA-89834_1.jpg',
+    product_name="Homem Cor.agio",
+    original_price="De: R$ 399,00",
+    final_price="Por: R$ 167,92",
+    coupon_code="AGOSTOA"
+)
+print(result)

tests/test_utils_url_tool.py ADDED Viewed

	@@ -0,0 +1,38 @@

+import pytest
+from utils_tools import GetImageUrlTool
+def test_get_image_url_tool_success():
+    """Test that GetImageUrlTool correctly extracts product_id and returns the expected image URL."""
+    tool = GetImageUrlTool()
+    # The sample URL carries extra query parameters besides the NATBRA id.
+    sample_url = "https://minhaloja.natura.com/p/refil-shampoo-mamae-e-bebe/NATBRA-92791?product=refil-shampoo-mamae-e-bebe&productId=NATBRA-92791&consultoria=lidimelocosmeticos&marca=natura"
+    expected_image_url = "https://production.na01.natura.com/on/demandware.static/-/Sites-natura-br-storefront-catalog/default/dw68595724/NATBRA-92791_1.jpg"
+    result = tool._run(sample_url)
+    assert result == expected_image_url
+def test_get_image_url_tool_different_id():
+    """Test with a different product_id to ensure extraction works generally."""
+    tool = GetImageUrlTool()
+    # Minimal URL: only the path segment and the productId parameter carry the id.
+    sample_url = "https://minhaloja.natura.com/p/some-product/NATBRA-12345?productId=NATBRA-12345"
+    expected_image_url = "https://production.na01.natura.com/on/demandware.static/-/Sites-natura-br-storefront-catalog/default/dw68595724/NATBRA-12345_1.jpg"
+    result = tool._run(sample_url)
+    assert result == expected_image_url
+def test_get_image_url_tool_invalid_input_type():
+    """Test that a ValueError is raised if product_url is not a string."""
+    tool = GetImageUrlTool()
+    # _run is called directly so the tool's own isinstance check is what is exercised.
+    with pytest.raises(ValueError, match="product_url must be a string."):
+        tool._run(12345)  # type: ignore
+def test_get_image_url_tool_missing_pattern():
+    """Test that a ValueError is raised if NATBRA-<digits> pattern is not found."""
+    tool = GetImageUrlTool()
+    # The id uses an "INVALID-" prefix, so the NATBRA-<digits> search finds nothing.
+    invalid_url = "https://minhaloja.natura.com/p/some-product/INVALID-12345?productId=INVALID-12345"
+    with pytest.raises(ValueError, match="Could not extract product_id from the provided URL."):
+        tool._run(invalid_url)

utils_tools.py ADDED Viewed

	@@ -0,0 +1,119 @@

+import requests
+from crewai.tools import BaseTool
+import re
+from typing import Any
+from merchs.merch import Merchant, NaturaMerchant, MercadoLivreMerchant
+class CalculateDiscountedPriceTool(BaseTool):
+    """
+    A tool to calculate the final price of an item after a discount is applied.
+    """
+    name: str = "Calculate Discounted Price Tool"
+    description: str = "Calculates the price after applying a given discount percentage."
+    def _run(self, original_price: float, discount_percentage: float) -> float:
+        """Return the price after applying a percentage discount.
+
+        Args:
+            original_price: The initial price of the item as a float or integer.
+            discount_percentage: The discount to apply, between 0 and 100 inclusive.
+        Returns:
+            float:
+                - The final discounted price, rounded to 2 decimal places.
+        Raises:
+            ValueError: If either argument is not a number, or if
+                discount_percentage is outside the 0-100 range.
+        """
+        if not isinstance(original_price, (int, float)) or not isinstance(discount_percentage, (int, float)):
+            raise ValueError("Both original_price and discount_percentage must be numbers.")
+        if discount_percentage < 0 or discount_percentage > 100:
+            raise ValueError("Discount percentage must be between 0 and 100.")
+        discount_amount = original_price * (discount_percentage / 100)
+        discounted_price = original_price - discount_amount
+        return round(discounted_price, 2)
+class CalculateDiscountValueTool(BaseTool):
+    """
+    A tool to calculate the final discount value of an item after comparing the original value and the final value.
+    """
+    name: str = "Calculate Discount Value Tool"
+    description: str = "Calculates the discount value after comparing two values."
+    def _run(self, original_price: float, final_price: float) -> float:
+        """Calculates the total discounted amount give the original and final price.
+        This method takes an original price and a final price, validates
+        the inputs, and then computes the final discounted value.
+        Args:
+            original_price: The initial price of the item as a float or integer.
+            final_price: The final price after discount as a float or integer.
+        Returns:
+            float:
+                - The final discount value, rounded to 0 decimal places.
+        """
+        if not isinstance(original_price, (int, float)) or not isinstance(final_price, (int, float)):
+            raise ValueError("Both original_price and final_price must be numbers.")
+        discount_value = original_price - final_price
+        discount_percentage = (discount_value / original_price) * 100
+        return round(discount_percentage, 0)
+class GetImageUrlTool(BaseTool):
+    """
+    A tool to retrieve the image URL for a given product URL.
+    """
+    name: str = "Get Image URL Tool"
+    description: str = "Retrieves the image URL for a given product URL."
+    def _run(self, product_url: str) -> str:
+        """
+        Build the image URL for a product URL that contains a NATBRA-<digits> id.
+        No network request is made; the result is assembled from the id alone.
+        Example:
+            product_url = (
+                "https://minhaloja.natura.com/p/refil-shampoo-mamae-e-bebe/"
+                "NATBRA-92791?product=refil-shampoo-mamae-e-bebe&productId=NATBRA-92791"
+                "&consultoria=lidimelocosmeticos&marca=natura"
+            )
+            image_url = GetImageUrlTool()._run(product_url)
+            # Returns:
+            # "https://production.na01.natura.com/on/demandware.static/-/Sites-natura-br-storefront-catalog/default/dw68595724/NATBRA-92791_1.jpg"
+        Raises:
+            ValueError: If product_url is not a string, or if it contains no
+                NATBRA-<digits> pattern.
+        """
+        if not isinstance(product_url, str):
+            raise ValueError("product_url must be a string.")
+        # Extract the numeric part after "NATBRA-" using a regular expression.
+        # re.search takes the first occurrence anywhere in the URL.
+        match = re.search(r"NATBRA-(\d+)", product_url)
+        if not match:
+            raise ValueError(
+                "Could not extract product_id from the provided URL. "
+                "Expected a pattern like 'NATBRA-<digits>'."
+            )
+        product_id = match.group(1)
+        # Build the final image URL.
+        # NOTE(review): the "dw68595724" path segment is hard-coded; confirm it is
+        # stable across products.
+        image_url = (
+            f"https://production.na01.natura.com/on/demandware.static/-/Sites-natura-br-storefront-catalog/"
+            f"default/dw68595724/NATBRA-{product_id}_1.jpg"
+        )
+        return image_url
+class MerchantSelectorTool(BaseTool):
+    """Pick the Merchant implementation that matches a product URL."""
+    name: str = "Merchant Selector Tool"
+    description: str = "Selects the merchant based on url."
+    # Token forwarded to NaturaMerchant when a Natura URL is selected.
+    natura_api_token: str
+    def _run(self, original_url: str) -> Merchant:
+        """Return the merchant whose marker substring appears in ``original_url``.
+
+        The check is a case-sensitive substring match over the whole URL, and
+        Mercado Livre is tested before Natura.
+
+        Raises:
+            ValueError: If the URL matches none of the supported merchants.
+        """
+        if "mercadolivre" in original_url or "ml.com.br" in original_url:
+            return MercadoLivreMerchant()
+        elif "natura.com" in original_url:
+            return NaturaMerchant(natura_api_token=self.natura_api_token)
+        else:
+            raise ValueError("Unsupported merchant in URL.")

uv.lock CHANGED Viewed

@@ -574,8 +574,15 @@ dependencies = [
     { name = "crewai-tools" },
     { name = "gradio" },
     { name = "litellm" },
     { name = "playwright" },
     { name = "playwright-stealth" },
 ]
 [package.metadata]
@@ -585,10 +592,15 @@ requires-dist = [
     { name = "crewai-tools", specifier = ">=0.55.0" },
     { name = "gradio", specifier = ">=5.38.0" },
     { name = "litellm", specifier = ">=1.72.6" },
     { name = "playwright", specifier = ">=1.53.0" },
     { name = "playwright-stealth", specifier = ">=2.0.0" },
 ]
 [[package]]
 name = "crewai-tools"
 version = "0.55.0"
@@ -1261,6 +1273,15 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/a4/ed/1f1afb2e9e7f38a545d628f864d562a5ae64fe6f7a10e28ffb9b185b4e89/importlib_resources-6.5.2-py3-none-any.whl", hash = "sha256:789cfdc3ed28c78b67a06acb8126751ced69a3d5f79c095a98298cd8a760ccec", size = 37461, upload-time = "2025-01-03T18:51:54.306Z" },
 ]
 [[package]]
 name = "instructor"
 version = "1.10.0"
@@ -2430,6 +2451,15 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/b9/4e/c37ac19cea166a97de3a9690ad5ba340b3f4f4fcd5bf8237cedb2c2c7076/playwright_stealth-2.0.0-py3-none-any.whl", hash = "sha256:9eb3af1fd21619aac9fdd13a4a08141ed67159ac6310a94f7d2f758ba0cbe179", size = 32466, upload-time = "2025-06-18T03:54:53.394Z" },
 ]
 [[package]]
 name = "portalocker"
 version = "3.2.0"
@@ -2803,6 +2833,22 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/48/0a/c99fb7d7e176f8b176ef19704a32e6a9c6aafdf19ef75a187f701fc15801/pysbd-0.3.4-py3-none-any.whl", hash = "sha256:cd838939b7b0b185fcf86b0baf6636667dfb6e474743beeff878e9f42e022953", size = 71082, upload-time = "2021-02-11T16:36:33.351Z" },
 ]
 [[package]]
 name = "python-dateutil"
 version = "2.9.0.post0"

     { name = "crewai-tools" },
     { name = "gradio" },
     { name = "litellm" },
+    { name = "pillow" },
     { name = "playwright" },
     { name = "playwright-stealth" },
+    { name = "requests" },
+]
+[package.dev-dependencies]
+dev = [
+    { name = "pytest" },
 ]
 [package.metadata]
     { name = "crewai-tools", specifier = ">=0.55.0" },
     { name = "gradio", specifier = ">=5.38.0" },
     { name = "litellm", specifier = ">=1.72.6" },
+    { name = "pillow", specifier = ">=11.3.0" },
     { name = "playwright", specifier = ">=1.53.0" },
     { name = "playwright-stealth", specifier = ">=2.0.0" },
+    { name = "requests", specifier = ">=2.32.4" },
 ]
+[package.metadata.requires-dev]
+dev = [{ name = "pytest", specifier = ">=8.4.1" }]
 [[package]]
 name = "crewai-tools"
 version = "0.55.0"
     { url = "https://files.pythonhosted.org/packages/a4/ed/1f1afb2e9e7f38a545d628f864d562a5ae64fe6f7a10e28ffb9b185b4e89/importlib_resources-6.5.2-py3-none-any.whl", hash = "sha256:789cfdc3ed28c78b67a06acb8126751ced69a3d5f79c095a98298cd8a760ccec", size = 37461, upload-time = "2025-01-03T18:51:54.306Z" },
 ]
+[[package]]
+name = "iniconfig"
+version = "2.1.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/f2/97/ebf4da567aa6827c909642694d71c9fcf53e5b504f2d96afea02718862f3/iniconfig-2.1.0.tar.gz", hash = "sha256:3abbd2e30b36733fee78f9c7f7308f2d0050e88f0087fd25c2645f63c773e1c7", size = 4793, upload-time = "2025-03-19T20:09:59.721Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/2c/e1/e6716421ea10d38022b952c159d5161ca1193197fb744506875fbb87ea7b/iniconfig-2.1.0-py3-none-any.whl", hash = "sha256:9deba5723312380e77435581c6bf4935c94cbfab9b1ed33ef8d238ea168eb760", size = 6050, upload-time = "2025-03-19T20:10:01.071Z" },
+]
 [[package]]
 name = "instructor"
 version = "1.10.0"
     { url = "https://files.pythonhosted.org/packages/b9/4e/c37ac19cea166a97de3a9690ad5ba340b3f4f4fcd5bf8237cedb2c2c7076/playwright_stealth-2.0.0-py3-none-any.whl", hash = "sha256:9eb3af1fd21619aac9fdd13a4a08141ed67159ac6310a94f7d2f758ba0cbe179", size = 32466, upload-time = "2025-06-18T03:54:53.394Z" },
 ]
+[[package]]
+name = "pluggy"
+version = "1.6.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/f9/e2/3e91f31a7d2b083fe6ef3fa267035b518369d9511ffab804f839851d2779/pluggy-1.6.0.tar.gz", hash = "sha256:7dcc130b76258d33b90f61b658791dede3486c3e6bfb003ee5c9bfb396dd22f3", size = 69412, upload-time = "2025-05-15T12:30:07.975Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/54/20/4d324d65cc6d9205fabedc306948156824eb9f0ee1633355a8f7ec5c66bf/pluggy-1.6.0-py3-none-any.whl", hash = "sha256:e920276dd6813095e9377c0bc5566d94c932c33b27a3e3945d8389c374dd4746", size = 20538, upload-time = "2025-05-15T12:30:06.134Z" },
+]
 [[package]]
 name = "portalocker"
 version = "3.2.0"
     { url = "https://files.pythonhosted.org/packages/48/0a/c99fb7d7e176f8b176ef19704a32e6a9c6aafdf19ef75a187f701fc15801/pysbd-0.3.4-py3-none-any.whl", hash = "sha256:cd838939b7b0b185fcf86b0baf6636667dfb6e474743beeff878e9f42e022953", size = 71082, upload-time = "2021-02-11T16:36:33.351Z" },
 ]
+[[package]]
+name = "pytest"
+version = "8.4.1"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "colorama", marker = "sys_platform == 'win32'" },
+    { name = "iniconfig" },
+    { name = "packaging" },
+    { name = "pluggy" },
+    { name = "pygments" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/08/ba/45911d754e8eba3d5a841a5ce61a65a685ff1798421ac054f85aa8747dfb/pytest-8.4.1.tar.gz", hash = "sha256:7c67fd69174877359ed9371ec3af8a3d2b04741818c51e5e99cc1742251fa93c", size = 1517714, upload-time = "2025-06-18T05:48:06.109Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/29/16/c8a903f4c4dffe7a12843191437d7cd8e32751d5de349d45d3fe69544e87/pytest-8.4.1-py3-none-any.whl", hash = "sha256:539c70ba6fcead8e78eebbf1115e8b589e7565830d7d006a8723f19ac8a0afb7", size = 365474, upload-time = "2025-06-18T05:48:03.955Z" },
+]
 [[package]]
 name = "python-dateutil"
 version = "2.9.0.post0"