Spaces:
Running
Running
Tobias Bergmann
committed on
Commit
·
b2df681
1
Parent(s):
95c291e
row2byrow pure C implementation
Browse files- app.py +3 -1
- llama-server +2 -2
app.py
CHANGED
@@ -15,10 +15,12 @@ today_date = datetime.today().strftime("%B %-d, %Y") # noqa: DTZ002
|
|
15 |
|
16 |
SYS_PROMPT = f"""Today's Date: {today_date}.
|
17 |
You are Gemma, developed by Google. You are a helpful AI assistant"""
|
18 |
-
TITLE = "Gemma3 1b instruct IQ4_NL from local GGUF server"
|
19 |
DESCRIPTION = """
|
20 |
<p>Gemma3 1b instruct is an open-source LLM supporting a 128k context window. This demo uses only 2K context.
|
21 |
</p>
|
|
|
|
|
22 |
"""
|
23 |
LLAMA_CPP_SERVER = "http://127.0.0.1:8081"
|
24 |
MAX_NEW_TOKENS = 1024
|
|
|
15 |
|
16 |
SYS_PROMPT = f"""Today's Date: {today_date}.
|
17 |
You are Gemma, developed by Google. You are a helpful AI assistant"""
|
18 |
+
TITLE = "Gemma3 1b instruct IQ4_NL from local GGUF server using BPP library"
|
19 |
DESCRIPTION = """
|
20 |
<p>Gemma3 1b instruct is an open-source LLM supporting a 128k context window. This demo uses only 2K context.
|
21 |
</p>
|
22 |
+
<p> The BPP library implements matrix multiplication with far less multiplications.
|
23 |
+
</p>
|
24 |
"""
|
25 |
LLAMA_CPP_SERVER = "http://127.0.0.1:8081"
|
26 |
MAX_NEW_TOKENS = 1024
|
llama-server
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3ead85d6cb439c1f7abfcd987bd19e125471e0350e9035f2edbc2ec25af1014d
|
3 |
+
size 6362744
|