Spaces:

jdelavande
/

chat-ui-energy

Running on CPU Upgrade

nsarrazin committed on Feb 13

Commit

54a5aad

unverified ·

1 Parent(s): 3db4793

fix(hchat): update internal endpoint (#1716)

Files changed (2) hide show

chart/env/prod.yaml CHANGED Viewed

@@ -158,7 +158,7 @@ envVars:
         "endpoints": [
           {
             "type": "openai",
-            "baseURL": "https://proxy.serverless.api-inference.huggingface.tech/models/deepseek-ai/DeepSeek-R1-Distill-Qwen-32B/v1"
           }
         ]
       },
@@ -192,7 +192,7 @@ envVars:
         "endpoints": [
           {
             "type": "openai",
-            "baseURL": "https://proxy.serverless.api-inference.huggingface.tech/models/nvidia/Llama-3.1-Nemotron-70B-Instruct-HF/v1"
           }
         ]
       },
@@ -260,7 +260,7 @@ envVars:
         "endpoints": [
           {
             "type": "openai",
-            "baseURL": "https://proxy.serverless.api-inference.huggingface.tech/models/Qwen/Qwen2.5-Coder-32B-Instruct/v1"
           }
         ]
       },
@@ -279,7 +279,7 @@ envVars:
         "endpoints": [
           {
             "type": "openai",
-            "baseURL": "https://proxy.serverless.api-inference.huggingface.tech/models/meta-llama/Llama-3.2-11B-Vision-Instruct/v1",
             "multimodal": {
               "image": {
                 "maxSizeInMB": 10,
@@ -596,7 +596,7 @@ envVars:
     ]
   HF_ORG_ADMIN: '644171cfbd0c97265298aa99'
   HF_ORG_EARLY_ACCESS: '5e67bd5b1009063689407478'
-  HF_API_ROOT: 'https://proxy.serverless.api-inference.huggingface.tech/models'
 infisical:
   enabled: true
   env: "prod-us-east-1"

         "endpoints": [
           {
             "type": "openai",
+            "baseURL": "https://internal.api-inference.huggingface.co/models/deepseek-ai/DeepSeek-R1-Distill-Qwen-32B/v1"
           }
         ]
       },
         "endpoints": [
           {
             "type": "openai",
+            "baseURL": "https://internal.api-inference.huggingface.co/models/nvidia/Llama-3.1-Nemotron-70B-Instruct-HF/v1"
           }
         ]
       },
         "endpoints": [
           {
             "type": "openai",
+            "baseURL": "https://internal.api-inference.huggingface.co/models/Qwen/Qwen2.5-Coder-32B-Instruct/v1"
           }
         ]
       },
         "endpoints": [
           {
             "type": "openai",
+            "baseURL": "https://internal.api-inference.huggingface.co/models/meta-llama/Llama-3.2-11B-Vision-Instruct/v1",
             "multimodal": {
               "image": {
                 "maxSizeInMB": 10,
     ]
   HF_ORG_ADMIN: '644171cfbd0c97265298aa99'
   HF_ORG_EARLY_ACCESS: '5e67bd5b1009063689407478'
+  HF_API_ROOT: 'https://internal.api-inference.huggingface.co/models'
 infisical:
   enabled: true
   env: "prod-us-east-1"

scripts/updateLocalEnv.ts CHANGED Viewed

@@ -26,7 +26,7 @@ let full_config = `${PUBLIC_CONFIG}\n${SECRET_CONFIG}`;
 // replace the internal proxy url with the public endpoint
 full_config = full_config.replaceAll(
-	"https://proxy.serverless.api-inference.huggingface.tech",
 	"https://api-inference.huggingface.co"
 );

 // replace the internal proxy url with the public endpoint
 full_config = full_config.replaceAll(
+	"https://internal.api-inference.huggingface.co",
 	"https://api-inference.huggingface.co"
 );