Spaces:

CreitinGameplays
/

bloom-3b-conversational-gradio

Sleeping

CreitinGameplays committed on Apr 12, 2024

Commit

3cfe997

verified ·

1 Parent(s): 77fc397

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -3,7 +3,6 @@ import torch
 import bitsandbytes as bnb
 from transformers import AutoTokenizer, AutoModelForCausalLM, BitsAndBytesConfig
-"""
 # BNB config
 bnb_config = BitsAndBytesConfig(
     load_in_4bit=True,
@@ -12,15 +11,14 @@ bnb_config = BitsAndBytesConfig(
     bnb_4bit_compute_dtype=torch.bfloat16
 )
-quantization_config=bnb_config
-"""
 # Define the BLOOM model name
 model_name = "CreitinGameplays/bloom-3b-conversational"
 # Load tokenizer and model
 tokenizer = AutoTokenizer.from_pretrained(model_name)
-model = AutoModelForCausalLM.from_pretrained(model_name)
 def generate_text(user_prompt):
   """Generates text using the BLOOM model from Hugging Face Transformers and removes the user prompt."""

 import bitsandbytes as bnb
 from transformers import AutoTokenizer, AutoModelForCausalLM, BitsAndBytesConfig
 # BNB config
 bnb_config = BitsAndBytesConfig(
     load_in_4bit=True,
     bnb_4bit_compute_dtype=torch.bfloat16
 )
+#quantization_config=bnb_config
 # Define the BLOOM model name
 model_name = "CreitinGameplays/bloom-3b-conversational"
 # Load tokenizer and model
 tokenizer = AutoTokenizer.from_pretrained(model_name)
+model = AutoModelForCausalLM.from_pretrained(model_name, quantization_config=bnb_config)
 def generate_text(user_prompt):
   """Generates text using the BLOOM model from Hugging Face Transformers and removes the user prompt."""