DavidBrowne17 committed on
Commit
65e5d19
·
verified ·
1 Parent(s): 4432acb

Upload 4 files

Browse files
config.yaml ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ seed: 999
2
+ cudnn_deterministic: false
3
+ train_data_jsons:
4
+ - data/train/1splits/data.0.tiny.json
5
+ valid_data_jsons:
6
+ - data/val/1splits/data.0.tiny.json
7
+ batch_scale: 2000
8
+ max_length: 1500
9
+ min_length: 1
10
+ n_worker: 4
11
+ local_rank: -1
12
+ minibatch_debug: -1
13
+ n_epoch: 1
14
+ grad_accum: 64
15
+ global_learning_rate: 2.0e-06
16
+ local_learning_rate: 4.0e-06
17
+ grad_clip: 2.0
18
+ warmup_steps: 10000
19
+ total_steps: 55
20
+ dim: 4096
21
+ text_card: 1
22
+ existing_text_padding_id: 3
23
+ n_q: 16
24
+ dep_q: 8
25
+ card: 2048
26
+ num_heads: 32
27
+ num_layers: 32
28
+ hidden_scale: 4.5
29
+ causal: true
30
+ context: 3000
31
+ exp_dir: exp_data/Moshi/v3_full_emo_v0
32
+ print_freq: 5
33
+ save_interval: 10000
34
+ resume: null
35
+ merged_model_path: exp_data/Moshi/v3_full_emo_v0/model_merged.safetensors
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c08e186a7f0f051c2017095da0f79d9f5007255aabbdd140d08e6cc979d7a3e
3
+ size 15375499776
tokenizer-e351c8d8-checkpoint125.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09b782f0629851a271227fb9d36db65c041790365f11bbe5d3d59369cf863f50
3
+ size 384644900
tokenizer_spm_32k_3.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:78d4336533ddc26f9acf7250d7fb83492152196c6ea4212c841df76933f18d2d
3
+ size 552778