Spaces:
Sleeping
Sleeping
Commit
·
6c32632
1
Parent(s):
3e32321
Add comment about adaptability
Browse files
utils.py
CHANGED
|
@@ -7,6 +7,7 @@ from llama_cpp import json_schema_to_gbnf
|
|
| 7 |
# The llama_cpp Python HTTP server communicates with the AI model, similar
|
| 8 |
# to the OpenAI API but adds a unique "grammar" parameter.
|
| 9 |
# The real OpenAI API has other ways to set the output format.
|
|
|
|
| 10 |
|
| 11 |
URL = "http://localhost:5834/v1/chat/completions"
|
| 12 |
|
|
|
|
| 7 |
# The llama_cpp Python HTTP server communicates with the AI model, similar
|
| 8 |
# to the OpenAI API but adds a unique "grammar" parameter.
|
| 9 |
# The real OpenAI API has other ways to set the output format.
|
| 10 |
+
# It's possible to switch to another LLM API by changing the llm_streaming function.
|
| 11 |
|
| 12 |
URL = "http://localhost:5834/v1/chat/completions"
|
| 13 |
|