perplexity-chat

Running

BotifyCloudAdmin committed on Jan 31

Commit

d6b7bed

verified ·

1 Parent(s): e73ae5f

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -10,11 +10,16 @@ AVAILABLE_MODELS = {
     "Llama3.1-8b-Instruct": "meta-llama/Meta-Llama-3.1-8B-Instruct",
 }
-ENDPOINT_URL = "https://api.hyperbolic.xyz/v1"
-OAI_API_KEY = os.getenv('HYPERBOLIC_XYZ_KEY')
 PASSWORD = os.getenv("PASSWD")  # Store the password in an environment variable
-client = OpenAI(base_url=ENDPOINT_URL, api_key=OAI_API_KEY)
 def respond(
     message: str,
@@ -34,7 +39,13 @@ def respond(
     messages.append({"role": "user", "content": message})
     response = ""
-    for chunk in client.chat.completions.create(
         model=AVAILABLE_MODELS[model_choice],  # Use the selected model
         messages=messages,
         max_tokens=max_tokens,

     "Llama3.1-8b-Instruct": "meta-llama/Meta-Llama-3.1-8B-Instruct",
 }
+HYPERB_ENDPOINT_URL = "https://api.hyperbolic.xyz/v1"
+HF_ENDPOINT_URL = "https://huggingface.co/api/inference-proxy/together"
+HYPERB_API_KEY = os.getenv('HYPERBOLIC_XYZ_KEY')
+HF_API_KEY = os.getenv('HF_KEY')
 PASSWORD = os.getenv("PASSWD")  # Store the password in an environment variable
+DEPLOY_TO_HF = ["deepseek-ai/DeepSeek-V3"]
+hyperb_client = OpenAI(base_url=HYPERB_ENDPOINT_URL, api_key=HYPERB_API_KEY)
+hf_client = OpenAI(base_url=HF_ENDPOINT_URL, api_key=HF_API_KEY)
 def respond(
     message: str,
     messages.append({"role": "user", "content": message})
     response = ""
+    if model_choice in DEPLOY_TO_HF:
+        this_client = hf_client
+    else:
+        this_client = hyperb_client
+    for chunk in this_client.chat.completions.create(
         model=AVAILABLE_MODELS[model_choice],  # Use the selected model
         messages=messages,
         max_tokens=max_tokens,