Text Generation
Transformers
Safetensors
llama
model: llama
repo_name: llama_channel_0_sociology_Complete Random
file_name: llama_channel_0_sociology_Complete Random_5000_5.pt
pruning_style: channel
community: 0
pruning_ratio: 20
dataset_label: sociology
sparsity_ratio: 20
['tasksource/mmlu', 'sociology']
finetune: Complete Random
modules_size: 51
modules: ['12_gate', '30_attn.o', '29_attn.k', '27_mlp.up', '9_mlp.up', '12_mlp.down', '10_attn.q', '24_attn.o', '19_attn.v', '14_mlp.up', '3_gate', '7_mlp.up', '30_gate', '17_mlp.up', '18_mlp.up', '18_gate', '28_attn.v', '19_mlp.down', '19_gate', '26_mlp.up', '28_attn.q', '10_mlp.down', '13_attn.o', '20_gate', '11_gate', '13_attn.k', '9_attn.v', '13_mlp.up', '6_attn.v', '21_attn.o', '18_attn.o', '17_attn.k', '6_attn.k', '13_attn.v', '22_attn.q', '5_gate', '11_mlp.up', '29_mlp.down', '8_mlp.down', '20_mlp.up', '23_mlp.down', '11_attn.k', '6_attn.o', '19_attn.o', '7_mlp.down', '14_attn.k', '11_attn.q', '10_attn.o', '17_attn.q', '23_attn.v', '23_attn.k']
rank: 2
tags: ['model: llama', 'repo_name: llama_channel_0_sociology_Complete Random', 'file_name: llama_channel_0_sociology_Complete Random_5000_5.pt', 'base_model: meta-llama/Llama-2-7b-hf', 'pruning_style: channel', 'community: 0', 'pruning_ratio: 20', 'dataset_label: sociology', 'sparsity_ratio: 20', "dataset: ['tasksource/mmlu', 'sociology']", 'finetune: Complete Random', 'modules_size: 51', "modules: ['12_gate', '30_attn.o', '29_attn.k', '27_mlp.up', '9_mlp.up', '12_mlp.down', '10_attn.q', '24_attn.o', '19_attn.v', '14_mlp.up', '3_gate', '7_mlp.up', '30_gate', '17_mlp.up', '18_mlp.up', '18_gate', '28_attn.v', '19_mlp.down', '19_gate', '26_mlp.up', '28_attn.q', '10_mlp.down', '13_attn.o', '20_gate', '11_gate', '13_attn.k', '9_attn.v', '13_mlp.up', '6_attn.v', '21_attn.o', '18_attn.o', '17_attn.k', '6_attn.k', '13_attn.v', '22_attn.q', '5_gate', '11_mlp.up', '29_mlp.down', '8_mlp.down', '20_mlp.up', '23_mlp.down', '11_attn.k', '6_attn.o', '19_attn.o', '7_mlp.down', '14_attn.k', '11_attn.q', '10_attn.o', '17_attn.q', '23_attn.v', '23_attn.k']", 'rank: 2']
text-generation-inference