TravelMate-AI / huggingface.yaml
bharadwaj-m's picture
First Commit
09aa2b8
# Runtime: Gradio SDK, with app.py as the application file.
# Version-like values are quoted so they are always read as strings
# (an unquoted 3.10 would be parsed as the float 3.1).
sdk: gradio
sdk_version: "4.19.2"
app_file: app.py
python_version: "3.10"
# Hardware requirements
# cpu and memory are children of `hardware`; without the indentation they
# would be parsed as independent top-level keys.
hardware:
  cpu: 2
  memory: 16GB
# Build settings
# Named `build_settings` because this file also defines a top-level `build`
# key holding the build commands. Two identical keys in one mapping are
# invalid YAML, and parsers that tolerate them keep only the last one, which
# silently discarded these settings.
# NOTE(review): confirm the key name expected by whatever consumes this file.
build_settings:
  cuda: "None"  # No CUDA needed for CPU-only
  # System packages requested for the build image.
  system_packages:
    - build-essential
    - python3-dev
    - cmake
    - pkg-config
    - libopenblas-dev
    - libomp-dev
# Environment variables
# Each entry is one NAME=value string.
env:
  # Model identifiers
  - "MODEL_NAME=meta-llama/Llama-2-7b-chat-hf"
  - "EMBEDDING_MODEL=sentence-transformers/all-MiniLM-L6-v2"
  # Secrets are referenced through ${...} placeholders rather than stored
  # here; presumably substituted by the deployment environment - confirm.
  - "SECRET_KEY=${SECRET_KEY}"
  - "JWT_SECRET_KEY=${JWT_SECRET_KEY}"
  # Rate limiting and logging
  - "RATE_LIMIT_REQUESTS=100"
  - "RATE_LIMIT_WINDOW=3600"
  - "LOG_LEVEL=INFO"
# Dependencies
# Python package requirement specifiers, kept in their original order.
dependencies:
  # Gradio (same release as sdk_version)
  - gradio==4.19.2
  # LangChain packages
  - langchain==0.1.9
  - "langchain-core>=0.1.52,<0.2"
  - langchain-community==0.0.27
  - langchain-text-splitters==0.0.1
  - langchain-huggingface==0.0.3
  # Model, embedding and vector-search libraries
  - transformers==4.38.2
  - torch==2.2.1
  - accelerate==0.27.2
  - bitsandbytes==0.42.0
  - safetensors==0.4.2
  - sentence-transformers==2.6.1
  - faiss-cpu==1.7.4
  # Settings and configuration
  - pydantic==2.5.3
  - pydantic-settings==2.1.0
  - python-dotenv==1.0.0
  # Web API and authentication
  - fastapi==0.109.2
  - uvicorn==0.27.1
  - python-jose==3.3.0
  - passlib==1.7.4
  # NOTE(review): the only entry without a version pin - consider pinning
  # it like the others for reproducible builds.
  - python-multipart
  - bcrypt==4.1.2
  # HTTP clients, retries and caching
  - httpx==0.26.0
  - aiohttp==3.9.5
  - tenacity==8.2.3
  - cachetools==5.3.2
  # Utilities
  - numpy==1.26.3
  - tqdm==4.66.1
  - loguru==0.7.2
  - datasets==2.16.1
  - huggingface-hub==0.24.1
  - circuitbreaker==1.4.0
# Health check
# All four settings belong to `health_check`; without the indentation they
# would be parsed as independent top-level keys.
# NOTE(review): interval and timeout are presumably in seconds - confirm.
health_check:
  path: /health
  interval: 300
  timeout: 10
  retries: 3
# Resource limits
# cpu and memory are children of `resources`; without the indentation they
# would be parsed as independent top-level keys.
resources:
  cpu: 2
  memory: 16GB
# Cache settings
# The three settings are children of `cache`; without the indentation they
# would be parsed as independent top-level keys.
# NOTE(review): ttl is presumably in seconds and max_size an entry count -
# confirm against the code that reads these values.
cache:
  enabled: true
  ttl: 3600
  max_size: 1000
# Logging
# `handlers` is a list of two handler mappings (file and stream). The nesting
# matters: without it the second "- type" item follows a completed scalar
# value and the document does not parse.
logging:
  level: INFO
  format: "%(asctime)s - %(name)s - %(levelname)s - %(message)s"
  handlers:
    # File handler writing to app.log
    - type: file
      filename: app.log
      max_bytes: 10485760  # 10 * 1024 * 1024
      backup_count: 5
    # Stream handler targeting sys.stdout
    - type: stream
      stream: ext://sys.stdout
# Space settings
# Metadata for the Space. These keys are children of `space`; without the
# indentation `sdk` here would duplicate the top-level `sdk` key.
space:
  title: "TravelMate - AI Travel Assistant"
  description: "An AI-powered travel assistant using Llama-2 and RAG to help plan trips and provide travel information"
  license: mit
  sdk: gradio
  app_port: 7860
  app_url: "https://huggingface.co/spaces/bharadwaj-m/TravelMate-AI"
# Build commands
# Steps, in listed order: install requirements.txt, create the data
# directories, then call DataLoader().initialize_knowledge_base().
build:
  - pip install -r requirements.txt
  - mkdir -p data/vector_store data/user_profiles data/cache
  # Folded scalar: the line break below becomes a single space, so this is
  # one command string.
  - >-
    python -c "from core.data_loader import DataLoader;
    DataLoader().initialize_knowledge_base()"
# Run command
# Runs app.py (the file named by app_file) with the Python interpreter.
run: "python app.py"