Spaces:

AnilNiraula
/

FinChat

Sleeping

App Files Files Community

AnilNiraula committed on Jul 5

Commit

862e37a

verified ·

1 Parent(s): 07e778c

Update app.py

Browse files

Files changed (1) hide show

app.py +15 -10

app.py CHANGED Viewed

@@ -12,7 +12,7 @@ logger = logging.getLogger(__name__)
 device = torch.device("cpu")
 logger.info(f"Using device: {device}")
-# Response cache with new entry for step-by-step advice
 response_cache = {
     "hi": "Hello! I'm your financial advisor. How can I help with investing?",
     "hello": "Hello! I'm your financial advisor. How can I help with investing?",
@@ -83,7 +83,7 @@ except Exception as e:
     logger.error(f"Error loading model/tokenizer: {e}")
     raise
-# Pre-tokenize prompt prefix with improved few-shot example
 prompt_prefix = (
     "You are a financial advisor. Provide concise, actionable advice in a numbered list for step-by-step or idea prompts. "
     "Avoid repetition and vague statements. Use varied, specific steps.\n\n"
@@ -121,12 +121,12 @@ def chat_with_model(message, history=None):
         with torch.no_grad():
             outputs = model.generate(
                 **inputs,
-                max_new_tokens=100,  # Increased for detailed lists
-                min_length=20,  # Encourage substantive responses
-                do_sample=True,  # Sampling to avoid repetition
-                temperature=0.7,  # Balanced diversity
-                top_p=0.9,  # Nucleus sampling
-                no_repeat_ngram_size=2,  # Prevent repetitive phrases
                 pad_token_id=tokenizer.eos_token_id
             )
         response = tokenizer.decode(outputs[0], skip_special_tokens=True)
@@ -153,7 +153,12 @@ interface = gr.ChatInterface(
 )
 # Launch interface (conditional for Spaces)
-if __name__ == "__main__ and not os.getenv("HF_SPACE"):
     logger.info("Launching Gradio interface locally")
     try:
-        interface.launch(

 device = torch.device("cpu")
 logger.info(f"Using device: {device}")
+# Response cache with step-by-step advice
 response_cache = {
     "hi": "Hello! I'm your financial advisor. How can I help with investing?",
     "hello": "Hello! I'm your financial advisor. How can I help with investing?",
     logger.error(f"Error loading model/tokenizer: {e}")
     raise
+# Pre-tokenize prompt prefix with few-shot example
 prompt_prefix = (
     "You are a financial advisor. Provide concise, actionable advice in a numbered list for step-by-step or idea prompts. "
     "Avoid repetition and vague statements. Use varied, specific steps.\n\n"
         with torch.no_grad():
             outputs = model.generate(
                 **inputs,
+                max_new_tokens=100,
+                min_length=20,
+                do_sample=True,
+                temperature=0.7,
+                top_p=0.9,
+                no_repeat_ngram_size=2,
                 pad_token_id=tokenizer.eos_token_id
             )
         response = tokenizer.decode(outputs[0], skip_special_tokens=True)
 )
 # Launch interface (conditional for Spaces)
+if __name__ == "__main__" and not os.getenv("HF_SPACE"):
     logger.info("Launching Gradio interface locally")
     try:
+        interface.launch(share=False, debug=True)
+    except Exception as e:
+        logger.error(f"Error launching interface: {e}")
+        raise
+else:
+    logger.info("Running in Hugging Face Spaces, interface defined but not launched")