Text Generation
Transformers
Safetensors
llama
model: vicuna
repo_name: vicuna_channel_2_global_facts_Community
file_name: vicuna_channel_2_global_facts_Community_5000_5.pt
pruning_style: channel
community: 2
pruning_ratio: 20
dataset_label: global_facts
sparsity_ratio: 20
['tasksource/mmlu', 'global_facts']
finetune: Community
modules_size: 54
modules: ['10_attn.o', '10_attn.q', '11_attn.o', '11_attn.q', '11_mlp.down', '11_mlp.up', '12_attn.o', '12_attn.q', '12_gate', '12_mlp.down', '13_gate', '13_mlp.down', '13_mlp.up', '14_attn.k', '14_attn.o', '14_attn.v', '14_gate', '15_gate', '16_mlp.up', '17_mlp.down', '17_mlp.up', '18_attn.k', '18_attn.o', '18_gate', '19_attn.k', '19_attn.q', '20_attn.k', '20_attn.o', '21_gate', '21_mlp.down', '22_attn.q', '23_attn.v', '23_gate', '24_attn.v', '27_gate', '28_attn.o', '28_gate', '29_attn.k', '29_attn.o', '29_mlp.up', '30_attn.v', '3_attn.v', '3_gate', '4_attn.k', '4_attn.q', '4_mlp.up', '5_attn.k', '5_attn.v', '6_mlp.up', '8_attn.v', '8_mlp.up', '9_attn.q', '9_attn.v', '9_mlp.down']
rank: 1
tags: ['model: vicuna', 'repo_name: vicuna_channel_2_global_facts_Community', 'file_name: vicuna_channel_2_global_facts_Community_5000_5.pt', 'base_model: lmsys/vicuna-7b-v1.5', 'pruning_style: channel', 'community: 2', 'pruning_ratio: 20', 'dataset_label: global_facts', 'sparsity_ratio: 20', "dataset: ['tasksource/mmlu', 'global_facts']", 'finetune: Community', 'modules_size: 54', "modules: ['10_attn.o', '10_attn.q', '11_attn.o', '11_attn.q', '11_mlp.down', '11_mlp.up', '12_attn.o', '12_attn.q', '12_gate', '12_mlp.down', '13_gate', '13_mlp.down', '13_mlp.up', '14_attn.k', '14_attn.o', '14_attn.v', '14_gate', '15_gate', '16_mlp.up', '17_mlp.down', '17_mlp.up', '18_attn.k', '18_attn.o', '18_gate', '19_attn.k', '19_attn.q', '20_attn.k', '20_attn.o', '21_gate', '21_mlp.down', '22_attn.q', '23_attn.v', '23_gate', '24_attn.v', '27_gate', '28_attn.o', '28_gate', '29_attn.k', '29_attn.o', '29_mlp.up', '30_attn.v', '3_attn.v', '3_gate', '4_attn.k', '4_attn.q', '4_mlp.up', '5_attn.k', '5_attn.v', '6_mlp.up', '8_attn.v', '8_mlp.up', '9_attn.q', '9_attn.v', '9_mlp.down']", 'rank: 1']
text-generation-inference