Add grammar example
Browse files
README.md
CHANGED
@@ -160,15 +160,33 @@ pip install llama-cpp-python
|
|
160 |
|
161 |
```python
|
162 |
from llama_cpp import Llama
|
|
|
|
|
163 |
|
164 |
# Chat Completion API
|
165 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
166 |
llm = Llama(model_path="./gorilla-openfunctions-v2.IQ3_M.gguf", n_gpu_layers=33, n_ctx=16384, temperature=0.0, repeat_penalty=1.1)
|
167 |
-
|
168 |
messages = [
|
169 |
{
|
170 |
"role": "user",
|
171 |
-
"content": "What's the weather like in Oslo?"
|
172 |
}
|
173 |
],
|
174 |
tools=[{
|
@@ -192,12 +210,63 @@ print(llm.create_chat_completion(
|
|
192 |
}
|
193 |
}
|
194 |
}],
|
195 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
196 |
"type": "function",
|
197 |
"function": {
|
198 |
-
"name": "get_current_weather"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
199 |
}
|
200 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
201 |
))
|
202 |
```
|
203 |
|
|
|
160 |
|
161 |
```python
|
162 |
from llama_cpp import Llama
|
163 |
+
from llama_cpp.llama_grammar import LlamaGrammar
|
164 |
+
import json
|
165 |
|
166 |
# Chat Completion API
|
167 |
|
168 |
+
grammar = LlamaGrammar.from_json_schema(json.dumps({
|
169 |
+
"type": "array",
|
170 |
+
"items": {
|
171 |
+
"type": "object",
|
172 |
+
"required": [ "name", "arguments" ],
|
173 |
+
"properties": {
|
174 |
+
"name": {
|
175 |
+
"type": "string"
|
176 |
+
},
|
177 |
+
"arguments": {
|
178 |
+
"type": "object"
|
179 |
+
}
|
180 |
+
}
|
181 |
+
}
|
182 |
+
}))
|
183 |
+
|
184 |
llm = Llama(model_path="./gorilla-openfunctions-v2.IQ3_M.gguf", n_gpu_layers=33, n_ctx=16384, temperature=0.0, repeat_penalty=1.1)
|
185 |
+
response = llm.create_chat_completion(
|
186 |
messages = [
|
187 |
{
|
188 |
"role": "user",
|
189 |
+
"content": "What's the weather like in Oslo and Stockholm?"
|
190 |
}
|
191 |
],
|
192 |
tools=[{
|
|
|
210 |
}
|
211 |
}
|
212 |
}],
|
213 |
+
grammar = grammar
|
214 |
+
)
|
215 |
+
print(json.loads(response["choices"][0]["message"]["content"]))
|
216 |
+
|
217 |
+
print(llm.create_chat_completion(
|
218 |
+
messages = [
|
219 |
+
{
|
220 |
+
"role": "user",
|
221 |
+
"content": "What's the weather like in Oslo and Stockholm?"
|
222 |
+
},
|
223 |
+
{ # The tool_calls value is taken from the response to the request above, made with tool_choice active
|
224 |
+
"role": "assistant",
|
225 |
+
"content": None,
|
226 |
+
"tool_calls": [
|
227 |
+
{
|
228 |
+
"id": "call__0_get_current_weather_cmpl-...",
|
229 |
+
"type": "function",
|
230 |
+
"function": {
|
231 |
+
"name": "get_current_weather",
|
232 |
+
"arguments": '{ "location": "Oslo, NO" ,"unit": "celsius"} '
|
233 |
+
}
|
234 |
+
}
|
235 |
+
]
|
236 |
+
},
|
237 |
+
{ # The tool_call_id matches the id inside tool_calls above; content is the result of the function call you made
|
238 |
+
"role": "tool",
|
239 |
+
"content": 20,
|
240 |
+
"tool_call_id": "call__0_get_current_weather_cmpl-..."
|
241 |
+
}
|
242 |
+
],
|
243 |
+
tools=[{
|
244 |
"type": "function",
|
245 |
"function": {
|
246 |
+
"name": "get_current_weather",
|
247 |
+
"description": "Get the current weather in a given location",
|
248 |
+
"parameters": {
|
249 |
+
"type": "object",
|
250 |
+
"properties": {
|
251 |
+
"location": {
|
252 |
+
"type": "string",
|
253 |
+
"description": "The city and state, e.g. San Francisco, CA"
|
254 |
+
},
|
255 |
+
"unit": {
|
256 |
+
"type": "string",
|
257 |
+
"enum": [ "celsius", "fahrenheit" ]
|
258 |
+
}
|
259 |
+
},
|
260 |
+
"required": [ "location" ]
|
261 |
+
}
|
262 |
}
|
263 |
+
}],
|
264 |
+
#tool_choice={
|
265 |
+
# "type": "function",
|
266 |
+
# "function": {
|
267 |
+
# "name": "get_current_weather"
|
268 |
+
# }
|
269 |
+
#}
|
270 |
))
|
271 |
```
|
272 |
|