Spaces:
Runtime error
Runtime error
Commit
·
9f88a9b
1
Parent(s):
b28b3e5
Update app.py
Browse files
app.py
CHANGED
@@ -22,7 +22,7 @@ def init_args():
|
|
22 |
args.batch_size = 1
|
23 |
args.seq_length = 512
|
24 |
args.world_size = 1
|
25 |
-
args.use_int8 =
|
26 |
args.top_p = 0
|
27 |
args.repetition_penalty_range = 1024
|
28 |
args.repetition_penalty_slope = 0
|
@@ -40,11 +40,12 @@ def init_model():
|
|
40 |
model = LLaMa(args)
|
41 |
torch.set_default_tensor_type(torch.FloatTensor)
|
42 |
model = load_model(model, args.load_model_path)
|
43 |
-
print('
|
44 |
model.eval()
|
45 |
|
46 |
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
|
47 |
model.to(device)
|
|
|
48 |
lm_generation = LmGeneration(model, args.tokenizer)
|
49 |
|
50 |
|
|
|
22 |
args.batch_size = 1
|
23 |
args.seq_length = 512
|
24 |
args.world_size = 1
|
25 |
+
args.use_int8 = True
|
26 |
args.top_p = 0
|
27 |
args.repetition_penalty_range = 1024
|
28 |
args.repetition_penalty_slope = 0
|
|
|
40 |
model = LLaMa(args)
|
41 |
torch.set_default_tensor_type(torch.FloatTensor)
|
42 |
model = load_model(model, args.load_model_path)
|
43 |
+
print('load model done.')
|
44 |
model.eval()
|
45 |
|
46 |
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
|
47 |
model.to(device)
|
48 |
+
print('to cuda.')
|
49 |
lm_generation = LmGeneration(model, args.tokenizer)
|
50 |
|
51 |
|