Spaces:

SPBhai
/

BG_CHATBOT_RAG

Runtime error

SPBhai committed on Jan 21

Commit

6d76007

verified ·

1 Parent(s): 909c589

Loading the model without quantization

Files changed (1) hide show

app.py CHANGED Viewed

@@ -31,11 +31,10 @@ similarity_retriever = vector_store.as_retriever(
 )
 # Load the LLM
-quantization_config = BitsAndBytesConfig(load_in_8bit=True, device = "cpu")
 tokenizer = AutoTokenizer.from_pretrained("google/gemma-2-9b-it")
 llm_model = AutoModelForCausalLM.from_pretrained(
-    "google/gemma-2-9b-it",
-    quantization_config=quantization_config,
 )
 text_generation_pipeline = pipeline(
     model=llm_model,

 )
 # Load the LLM
+# quantization_config = BitsAndBytesConfig(load_in_8bit=True, device = "cpu")
 tokenizer = AutoTokenizer.from_pretrained("google/gemma-2-9b-it")
 llm_model = AutoModelForCausalLM.from_pretrained(
+    "google/gemma-2-9b-it"
 )
 text_generation_pipeline = pipeline(
     model=llm_model,