padmanabhbosamia committed on
Commit
2e9b2d7
·
verified ·
1 Parent(s): e9026bb

Changes to bitsandbytes (dependency removed from requirements.txt)

Browse files
Files changed (2) hide show
  1. app.py +2 -0
  2. requirements.txt +11 -9
app.py CHANGED
@@ -16,6 +16,7 @@ model = AutoModelForCausalLM.from_pretrained(
16
  device_map="auto",
17
  trust_remote_code=True,
18
  torch_dtype=torch.float16, # Use float16 for memory efficiency
 
19
  )
20
  tokenizer = AutoTokenizer.from_pretrained("./fine-tuned-model")
21
  tokenizer.pad_token = tokenizer.eos_token
@@ -28,6 +29,7 @@ base_model = AutoModelForCausalLM.from_pretrained(
28
  device_map="auto",
29
  trust_remote_code=True,
30
  torch_dtype=torch.float16,
 
31
  )
32
 
33
  def generate_response(
 
16
  device_map="auto",
17
  trust_remote_code=True,
18
  torch_dtype=torch.float16, # Use float16 for memory efficiency
19
+ low_cpu_mem_usage=True, # Add this for better memory handling
20
  )
21
  tokenizer = AutoTokenizer.from_pretrained("./fine-tuned-model")
22
  tokenizer.pad_token = tokenizer.eos_token
 
29
  device_map="auto",
30
  trust_remote_code=True,
31
  torch_dtype=torch.float16,
32
+ low_cpu_mem_usage=True, # Add this for better memory handling
33
  )
34
 
35
  def generate_response(
requirements.txt CHANGED
@@ -1,12 +1,14 @@
1
  torch>=2.0.0
2
- transformers>=4.30.0
3
- datasets>=2.12.0
4
- accelerate>=0.20.0
5
- bitsandbytes>=0.41.0
6
- peft>=0.4.0
7
- pytorch-lightning>=2.0.0
8
- gradio>=3.40.0
9
- wandb>=0.15.0
10
- rich>=13.0.0
 
 
11
  sentencepiece>=0.1.99
12
  protobuf>=4.23.0
 
1
  torch>=2.0.0
2
+ transformers>=4.36.0
3
+ datasets>=2.14.0
4
+ accelerate>=0.25.0
5
+ peft>=0.7.0
6
+ trl>=0.7.4
7
+ wandb>=0.16.0
8
+ gradio>=4.0.0
9
+ rich>=13.7.0
10
+ numpy>=1.24.0
11
+ tqdm>=4.66.0
12
+ scipy>=1.11.0
13
  sentencepiece>=0.1.99
14
  protobuf>=4.23.0