Spaces:

Viraj2307
/

Fine-Tune-LLM

Sleeping

App Files Files Community

viraj committed on Nov 22, 2024

Commit

dacf14a

1 Parent(s): e5afeb9

Initial Commit

Browse files

Files changed (27) hide show

.gitignore +14 -0
FineTuning.ipynb +0 -0
Makefile +13 -0
backend/.DS_Store +0 -0
backend/Dockerfile +10 -0
backend/README.md +0 -0
backend/__init__.py +0 -0
backend/app/__init__.py +1 -0
backend/app/api/__init__.py +0 -0
backend/app/api/v1/__init__.py +0 -0
backend/app/api/v1/config.py +20 -0
backend/app/api/v1/qa.py +21 -0
backend/app/api/v1/schemas.py +7 -0
backend/app/main.py +12 -0
backend/app/models.py +23 -0
backend/app/schemas.py +7 -0
backend/requirements.txt +6 -0
backend/tests/__init__.py +0 -0
backend/tests/test_config.py +10 -0
backend/tests/test_qa.py +11 -0
docker-compose.yml +22 -0
frontend/.streamlit/config.toml +4 -0
frontend/Dockerfile +10 -0
frontend/README.md +0 -0
frontend/app.py +23 -0
frontend/requirements.txt +4 -0
setup_template.py +52 -0

.gitignore ADDED Viewed

	@@ -0,0 +1,14 @@

+/env
+__pycache__/
+*.pyc
+*.pyo
+*.pyd
+*.db
+*.sqlite
+.env
+venv/
+*.log
+/venv
+/.venv
+.venv
+backend/fine-tuned-model

FineTuning.ipynb ADDED Viewed

The diff for this file is too large to render. See raw diff

Makefile ADDED Viewed

	@@ -0,0 +1,13 @@

+# Define variables for backend and frontend directories
+BACKEND_DIR = backend
+FRONTEND_DIR = frontend
+# These targets are commands, not files. Declaring them phony keeps a file or
+# directory that happens to share a name from making a target look up to date.
+.PHONY: start-backend start-frontend up
+# Install backend dependencies, then serve the FastAPI app on port 8000.
+start-backend:
+	cd $(BACKEND_DIR) && pip3 install -r requirements.txt && uvicorn app.main:app --host 0.0.0.0 --port 8000
+# Install frontend dependencies, then launch the Streamlit UI.
+start-frontend:
+	cd $(FRONTEND_DIR) && pip3 install -r requirements.txt && streamlit run app.py
+# Start the backend in the background and the frontend in the foreground.
+up:
+	$(MAKE) start-backend &
+	$(MAKE) start-frontend

backend/.DS_Store ADDED Viewed

Binary file (6.15 kB). View file

backend/Dockerfile ADDED Viewed

	@@ -0,0 +1,10 @@

+FROM python:3.11-slim
+WORKDIR /app
+# Install dependencies before copying the source so this layer stays cached
+# when only application code changes.
+COPY requirements.txt .
+RUN pip install --no-cache-dir -r requirements.txt
+# COPY of a directory copies its *contents*, so the destination must be
+# /app/app for the `app` package named in CMD to be importable from /app.
+COPY app /app/app
+# NOTE(review): the code loads "fine-tuned-model" by relative name and nothing
+# here copies it into the image -- confirm how the model is provided.
+CMD ["uvicorn", "app.main:app", "--host", "0.0.0.0", "--port", "8000"]

backend/README.md ADDED Viewed

File without changes

backend/__init__.py ADDED Viewed

File without changes

backend/app/__init__.py ADDED Viewed

	@@ -0,0 +1 @@


+from .models import predict_sentiment

backend/app/api/__init__.py ADDED Viewed

File without changes

backend/app/api/v1/__init__.py ADDED Viewed

File without changes

backend/app/api/v1/config.py ADDED Viewed

	@@ -0,0 +1,20 @@

+from fastapi import APIRouter, HTTPException
+from .schemas import ConfigRequest
+from transformers import AutoModelForQuestionAnswering, AutoTokenizer, pipeline, AutoModelForSequenceClassification
+from app.models import predict_sentiment
+# Router for this module; main.py mounts it under the "/config" prefix.
+router = APIRouter()
+# Identifier passed to from_pretrained() for the initial tokenizer and model.
+model_name = "fine-tuned-model"
+# Both objects are loaded at import time.
+# NOTE(review): use_safetensors looks like a model-weights option -- confirm
+# it has any effect when loading a tokenizer.
+tokenizer = AutoTokenizer.from_pretrained(model_name, use_safetensors=True)
+model = AutoModelForSequenceClassification.from_pretrained(model_name)
+@router.post("/")
+def configure_model(config: ConfigRequest):
+    global model, tokenizer, qa_pipeline
+    try:
+        model = AutoModelForQuestionAnswering.from_pretrained(config.model_name)
+        tokenizer = AutoTokenizer.from_pretrained(config.model_name)
+        return {"message": f"Model loaded successfully: {config.model_name}"}
+    except Exception as e:
+        raise HTTPException(status_code=500, detail=str(e))

backend/app/api/v1/qa.py ADDED Viewed

	@@ -0,0 +1,21 @@

+from fastapi import APIRouter, HTTPException
+from .schemas import QARequest
+from transformers import AutoModelForSequenceClassification
+from transformers import AutoModelForQuestionAnswering, AutoTokenizer
+from app.models import predict_sentiment
+# Router for this module; main.py mounts it under the "/qa" prefix.
+router = APIRouter()
+# Identifier passed to from_pretrained() below.
+model_name = "fine-tuned-model"
+# NOTE(review): get_answer below only calls predict_sentiment (from
+# app.models) and never reads this tokenizer/model -- confirm whether this
+# additional import-time load is needed.
+tokenizer = AutoTokenizer.from_pretrained(model_name, use_safetensors=True)
+model = AutoModelForSequenceClassification.from_pretrained(model_name)
+@router.post("/")
+def get_answer(request: QARequest):
+    try:
+        sentiment, probs = predict_sentiment(request.command)
+        probs = [float(prob) for prob in probs]
+        print({"review": request.command, "sentiment": sentiment, "probs": probs})
+        return {"review": request.command, "sentiment": sentiment, "probs": probs}
+    except Exception as e:
+        raise HTTPException(status_code=500, detail=str(e))

backend/app/api/v1/schemas.py ADDED Viewed

	@@ -0,0 +1,7 @@

+from pydantic import BaseModel
+class QARequest(BaseModel):
+    """Request body accepted by the /qa endpoint."""
+    # Review text; the /qa handler passes it to predict_sentiment.
+    command: str
+class ConfigRequest(BaseModel):
+    """Request body accepted by the /config endpoint."""
+    # Model identifier; the /config handler passes it to from_pretrained().
+    model_name: str

backend/app/main.py ADDED Viewed

	@@ -0,0 +1,12 @@

+from fastapi import FastAPI
+from .api.v1 import qa, config
+app = FastAPI()
+# Include routers for the API
+app.include_router(qa.router, prefix="/qa", tags=["qa"])
+app.include_router(config.router, prefix="/config", tags=["config"])
+if __name__ == "__main__":
+    import uvicorn
+    uvicorn.run(app, host="0.0.0.0", port=8000, reload=True)

backend/app/models.py ADDED Viewed

	@@ -0,0 +1,23 @@

+from transformers import AutoTokenizer, AutoModelForSequenceClassification
+import torch
+import os
+# Identifier passed to from_pretrained(). .gitignore lists
+# backend/fine-tuned-model, so this is presumably a local directory resolved
+# against the working directory -- TODO confirm.
+model_name = "fine-tuned-model"
+# Loaded once at import time and used by every predict_sentiment call.
+tokenizer = AutoTokenizer.from_pretrained(model_name, use_safetensors=True)
+model = AutoModelForSequenceClassification.from_pretrained(model_name)
+# Device the tokenized inputs are moved to in predict_sentiment (fixed to CPU).
+device = torch.device("cpu")
+def predict_sentiment(review_text):
+    inputs = tokenizer(review_text, padding=True, truncation=True, return_tensors="pt").to(device)
+    with torch.no_grad():
+        outputs = model(**inputs)
+    logits = outputs.logits
+    predictions = torch.softmax(logits, dim=-1)
+    predicted_label = torch.argmax(predictions, dim=-1).item()
+    sentiment = "Positive" if predicted_label == 1 else "Negative"
+    return sentiment, predictions[0].cpu().numpy()

backend/app/schemas.py ADDED Viewed

	@@ -0,0 +1,7 @@

+from pydantic import BaseModel
+class QARequest(BaseModel):
+    """Request body carrying a single text field.
+
+    NOTE(review): an identical class exists in app/api/v1/schemas.py, which is
+    the copy the routers import -- confirm whether this module is still needed.
+    """
+    command: str
+class ConfigRequest(BaseModel):
+    """Request body carrying the name of a model to load.
+
+    NOTE(review): an identical class exists in app/api/v1/schemas.py, which is
+    the copy the routers import -- confirm whether this module is still needed.
+    """
+    model_name: str

backend/requirements.txt ADDED Viewed

	@@ -0,0 +1,6 @@

+fastapi==0.95.2
+uvicorn==0.22.0
+transformers==4.34.0
+torch==2.3.1
+pydantic==1.10.7
+requests==2.31.0

backend/tests/__init__.py ADDED Viewed

File without changes

backend/tests/test_config.py ADDED Viewed

	@@ -0,0 +1,10 @@

+import pytest
+from fastapi.testclient import TestClient
+from backend.app.main import app
+client = TestClient(app)
+def test_configure_model():
+    response = client.post("/config/", json={"model_name": "distilbert-base-uncased-distilled-squad"})
+    assert response.status_code == 200
+    assert "message" in response.json()

backend/tests/test_qa.py ADDED Viewed

	@@ -0,0 +1,11 @@

+import pytest
+from fastapi.testclient import TestClient
+from backend.app.main import app
+client = TestClient(app)
+def test_get_answer():
+    response = client.post("/qa/", json={"context": "Hello world", "question": "What is this?"})
+    assert response.status_code == 200
+    assert "answer" in response.json()
+    assert "score" in response.json()

docker-compose.yml ADDED Viewed

	@@ -0,0 +1,22 @@

+# Compose file format version (this is not the Python version).
+version: '3.8'
+services:
+  backend:
+    build:
+      context: ./backend
+    ports:
+      - "8000:8000"
+    volumes:
+      - ./backend:/app
+  frontend:
+    build:
+      context: ./frontend
+    ports:
+      - "8501:8501"
+    volumes:
+      - ./frontend:/app
+    environment:
+      # Containers reach each other by service name on the Compose network;
+      # 0.0.0.0 is a bind address, not a destination. The frontend only
+      # honours this if app.py reads API_URL from the environment.
+      - API_URL=http://backend:8000
+    depends_on:
+      - backend

frontend/.streamlit/config.toml ADDED Viewed

	@@ -0,0 +1,4 @@

+[theme]
+base="dark"
+primaryColor="#00b4ff"
+backgroundColor="#000000"

frontend/Dockerfile ADDED Viewed

	@@ -0,0 +1,10 @@

+FROM python:3.11-slim
+WORKDIR /app
+# Dependencies are installed before the application source is copied.
+COPY requirements.txt .
+RUN pip install --no-cache-dir -r requirements.txt
+# Only app.py is copied.
+# NOTE(review): .streamlit/config.toml (the theme) is not copied into the
+# image -- confirm that is intended.
+COPY app.py /app
+# Serve the Streamlit app on port 8501, the port docker-compose.yml publishes.
+CMD ["streamlit", "run", "app.py", "--server.port", "8501"]

frontend/README.md ADDED Viewed

File without changes

frontend/app.py ADDED Viewed

	@@ -0,0 +1,23 @@

+import streamlit as st
+import requests
+API_URL = "http://localhost:8000"
+st.title("BERT Fine Tuned Model on IMBD dataset")
+st.header("try with reviews")
+question = st.text_input("Review")
+if st.button("Get Answer"):
+    if question:
+        print(f"{API_URL}/qa/")
+        response = requests.post(f"{API_URL}/qa/", json={"command": question})
+        if response.status_code == 200:
+            answer = response.json()
+            st.write(f"**Review**: {answer['review']}")
+            st.write(f"**Sentiment**: {answer['sentiment']}")
+            st.write(f"**Probs**: {answer['probs']}")
+        else:
+            st.error(f"Error: {response.json().get('detail', 'Unknown error')}")
+    else:
+        st.error("Please provide both context and question.")

frontend/requirements.txt ADDED Viewed

	@@ -0,0 +1,4 @@

+streamlit==1.37.0
+pandas==2.2.2
+requests==2.31.0

setup_template.py ADDED Viewed

	@@ -0,0 +1,52 @@

+import os
+from pathlib import Path
+import logging
+logging.basicConfig(
+    level=logging.INFO,
+    format='[%(asctime)s]: %(message)s',
+)
+project_name = 'my_project'
+list_of_files = [
+    # Backend
+    f"backend/app/__init__.py",
+    f"backend/app/main.py",
+    f"backend/app/models.py",
+    f"backend/app/schemas.py",
+    f"backend/app/api/__init__.py",
+    f"backend/app/api/v1/__init__.py",
+    f"backend/app/api/v1/qa.py",
+    f"backend/app/api/v1/config.py",
+    f"backend/tests/__init__.py",
+    f"backend/tests/test_qa.py",
+    f"backend/tests/test_config.py",
+    f"backend/Dockerfile",
+    f"backend/requirements.txt",
+    f"backend/README.md",
+    # Frontend
+    f"frontend/app.py",
+    f"frontend/Dockerfile",
+    f"frontend/requirements.txt",
+    f"frontend/README.md",
+    # Root
+    ".gitignore",
+    "README.md"
+]
+for path in list_of_files:
+    file_path = Path(path)
+    filedir, filename = os.path.split(file_path)
+    if filedir != "":
+        os.makedirs(filedir, exist_ok=True)
+        logging.info(f"Created directory {filedir}")
+    if (not os.path.exists(file_path)) or (os.path.getsize(file_path) == 0):
+        with open(file_path, "w") as f:
+            pass
+            logging.info(f"Created file {filename}")
+    else:
+        logging.info(f"File {filename} already exists")