Spaces:

Nitzantry1
/

try3

Sleeping

Nitzantry1 committed on Oct 14, 2024

Commit

8106ffa

verified ·

1 Parent(s): c102310

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -17,22 +17,13 @@ device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
 print('Using device:', device)
 print()
-# יצירת המנוע עם Accelerate במידת הצורך
-if device.type == 'cuda':
-    generator = pipeline('text-generation', model=model_id,
-                         tokenizer=model_id,
-                         torch_dtype=torch.float16,
-                         use_fast=should_use_fast,
-                         trust_remote_code=True,
-                         device_map="auto")
-else:
-    from accelerate import init_empty_weights, infer_auto_device_map
-    from transformers import AutoModelForCausalLM, AutoTokenizer
-    tokenizer = AutoTokenizer.from_pretrained(model_id, use_fast=should_use_fast)
-    with init_empty_weights():
-        model = AutoModelForCausalLM.from_pretrained(model_id, trust_remote_code=True)
-    generator = pipeline('text-generation', model=model, tokenizer=tokenizer, device=device)
 # פונקציית יצירת הטקסט
 def chat_with_model(history):

 print('Using device:', device)
 print()
+# יצירת המנוע עם pipeline
+generator = pipeline('text-generation', model=model_id,
+                     tokenizer=model_id,
+                     torch_dtype=torch.float16 if device.type == 'cuda' else torch.float32,
+                     use_fast=should_use_fast,
+                     trust_remote_code=True,
+                     device_map="auto" if device.type == 'cuda' else None)
 # פונקציית יצירת הטקסט
 def chat_with_model(history):