Manju017 commited on
Commit
bce1941
·
verified ·
1 Parent(s): 1101f80

Update app.py to include the necessary imports and settings so that the Accelerate library is used effectively.

Browse files
Files changed (1) hide show
  1. app.py +18 -11
app.py CHANGED
@@ -1,30 +1,37 @@
1
  import gradio as gr
2
  from transformers import AutoModelForCausalLM, AutoTokenizer
 
3
 
 
4
  model_name = "ai4bharat/Airavata"
5
 
6
- # Load the model in 8-bit precision to reduce memory usage
 
 
 
 
 
 
7
  model = AutoModelForCausalLM.from_pretrained(
8
  model_name,
9
- device_map="auto",
10
- load_in_8bit=True
11
  )
12
- tokenizer = AutoTokenizer.from_pretrained(model_name)
13
 
14
- def generate_text(prompt, max_length):
 
15
  inputs = tokenizer(prompt, return_tensors="pt")
16
- outputs = model.generate(**inputs, max_length=max_length)
17
  return tokenizer.decode(outputs[0], skip_special_tokens=True)
18
 
 
19
  interface = gr.Interface(
20
  fn=generate_text,
21
- inputs=[
22
- gr.inputs.Textbox(label="Enter your prompt"),
23
- gr.inputs.Slider(10, 100, step=10, label="Max length")
24
- ],
25
  outputs="text",
26
  title="Airavata Text Generation Model",
27
- description="Generate text in Indic languages using the Airavata model."
28
  )
29
 
 
30
  interface.launch()
 
import gradio as gr
from transformers import AutoConfig, AutoModelForCausalLM, AutoTokenizer
from accelerate import infer_auto_device_map, init_empty_weights

# Hugging Face Hub id of the AI4Bharat Airavata model.
model_name = "ai4bharat/Airavata"

# Load the tokenizer.
tokenizer = AutoTokenizer.from_pretrained(model_name)

# BUG FIX: infer_auto_device_map() expects an instantiated model, not a
# repo-id string — passing `model_name` raises at startup.  Build an
# empty (meta-device) model from the config so the device map can be
# computed without allocating real weights.
config = AutoConfig.from_pretrained(model_name)
with init_empty_weights():
    empty_model = AutoModelForCausalLM.from_config(config)
device_map = infer_auto_device_map(empty_model)

# Load the real weights, placed across devices per the computed map.
model = AutoModelForCausalLM.from_pretrained(
    model_name,
    device_map=device_map,
    load_in_8bit=True,  # 8-bit precision to reduce memory usage
)
 
20
 
21
# Inference function wired into the Gradio interface below.
def generate_text(prompt, max_new_tokens=None):
    """Generate a continuation of *prompt* with the Airavata model.

    Args:
        prompt: Input text to condition generation on.
        max_new_tokens: Optional cap on the number of newly generated
            tokens. ``None`` (the default) keeps the model's own
            generation defaults, preserving the original behaviour.

    Returns:
        The generated sequence decoded to a string, with special tokens
        stripped.
    """
    inputs = tokenizer(prompt, return_tensors="pt")
    # Only forward the cap when the caller supplied one, so the default
    # call path is byte-for-byte equivalent to model.generate(**inputs).
    extra = {} if max_new_tokens is None else {"max_new_tokens": max_new_tokens}
    outputs = model.generate(**inputs, **extra)
    return tokenizer.decode(outputs[0], skip_special_tokens=True)
26
 
27
# Build the Gradio UI: one free-text input, generated text as output.
interface = gr.Interface(
    generate_text,
    inputs="text",
    outputs="text",
    title="Airavata Text Generation Model",
    description="This is the AI4Bharat Airavata model for text generation in Indic languages.",
)

# Start the web app.
interface.launch()