Text Generation
Transformers
Safetensors
llama
model: vicuna
repo_name: vicuna_channel_4_salient_translation_error_detection_Complete Random
file_name: vicuna_channel_4_salient_translation_error_detection_Complete Random_5000_5.pt
pruning_style: channel
community: 4
pruning_ratio: 20
dataset_label: salient_translation_error_detection
sparsity_ratio: 20
['tasksource/bigbench', 'salient_translation_error_detection']
finetune: Complete Random
modules_size: 29
modules: ['4_attn.k', '28_attn.q', '23_mlp.down', '9_attn.v', '18_attn.k', '14_attn.v', '4_gate', '13_attn.q', '25_attn.o', '5_mlp.down', '3_gate', '17_gate', '21_gate', '11_attn.q', '6_attn.v', '25_mlp.down', '30_gate', '16_attn.o', '9_gate', '30_mlp.up', '26_attn.v', '26_attn.k', '20_attn.o', '17_attn.o', '4_attn.q', '13_mlp.down', '16_mlp.up', '24_attn.o', '19_mlp.up']
rank: 2
tags: ['model: vicuna', 'repo_name: vicuna_channel_4_salient_translation_error_detection_Complete Random', 'file_name: vicuna_channel_4_salient_translation_error_detection_Complete Random_5000_5.pt', 'base_model: lmsys/vicuna-7b-v1.5', 'pruning_style: channel', 'community: 4', 'pruning_ratio: 20', 'dataset_label: salient_translation_error_detection', 'sparsity_ratio: 20', "dataset: ['tasksource/bigbench', 'salient_translation_error_detection']", 'finetune: Complete Random', 'modules_size: 29', "modules: ['4_attn.k', '28_attn.q', '23_mlp.down', '9_attn.v', '18_attn.k', '14_attn.v', '4_gate', '13_attn.q', '25_attn.o', '5_mlp.down', '3_gate', '17_gate', '21_gate', '11_attn.q', '6_attn.v', '25_mlp.down', '30_gate', '16_attn.o', '9_gate', '30_mlp.up', '26_attn.v', '26_attn.k', '20_attn.o', '17_attn.o', '4_attn.q', '13_mlp.down', '16_mlp.up', '24_attn.o', '19_mlp.up']", 'rank: 2']
text-generation-inference