Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Clean up; add gemma-2-2b-it #12

Open
wants to merge 2 commits into
base: main
Choose a base branch
from
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
319 changes: 319 additions & 0 deletions model_snr_results/snr_results_google-gemma-2-2b-it.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,319 @@
{
"mlp.down_proj": {
"model.layers.4.mlp.down_proj": 33.30361557006836,
"model.layers.2.mlp.down_proj": 28.84607696533203,
"model.layers.6.mlp.down_proj": 19.587360382080078,
"model.layers.15.mlp.down_proj": 15.88519287109375,
"model.layers.24.mlp.down_proj": 15.06785774230957,
"model.layers.14.mlp.down_proj": 13.604269027709961,
"model.layers.17.mlp.down_proj": 13.215081214904785,
"model.layers.25.mlp.down_proj": 13.187742233276367,
"model.layers.22.mlp.down_proj": 12.597224235534668,
"model.layers.23.mlp.down_proj": 11.809103965759277,
"model.layers.20.mlp.down_proj": 11.670610427856445,
"model.layers.5.mlp.down_proj": 11.197671890258789,
"model.layers.21.mlp.down_proj": 9.488790512084961,
"model.layers.7.mlp.down_proj": 9.305631637573242,
"model.layers.18.mlp.down_proj": 9.030320167541504,
"model.layers.13.mlp.down_proj": 8.854863166809082,
"model.layers.3.mlp.down_proj": 8.736675262451172,
"model.layers.0.mlp.down_proj": 8.105010032653809,
"model.layers.19.mlp.down_proj": 7.772491455078125,
"model.layers.10.mlp.down_proj": 7.373418807983398,
"model.layers.16.mlp.down_proj": 7.208968639373779,
"model.layers.8.mlp.down_proj": 6.769254207611084,
"model.layers.11.mlp.down_proj": 6.636877536773682,
"model.layers.12.mlp.down_proj": 5.944761753082275,
"model.layers.9.mlp.down_proj": 5.525699615478516,
"model.layers.1.mlp.down_proj": 4.299622535705566
},
"mlp.up_proj": {
"model.layers.4.mlp.up_proj": 170.2850799560547,
"model.layers.2.mlp.up_proj": 124.66849517822266,
"model.layers.3.mlp.up_proj": 112.8239517211914,
"model.layers.6.mlp.up_proj": 48.43644332885742,
"model.layers.1.mlp.up_proj": 41.71646499633789,
"model.layers.5.mlp.up_proj": 32.67828369140625,
"model.layers.0.mlp.up_proj": 28.067331314086914,
"model.layers.7.mlp.up_proj": 28.041343688964844,
"model.layers.17.mlp.up_proj": 26.711233139038086,
"model.layers.15.mlp.up_proj": 21.886568069458008,
"model.layers.10.mlp.up_proj": 19.634605407714844,
"model.layers.9.mlp.up_proj": 16.594703674316406,
"model.layers.18.mlp.up_proj": 16.550199508666992,
"model.layers.12.mlp.up_proj": 15.803447723388672,
"model.layers.11.mlp.up_proj": 15.281010627746582,
"model.layers.16.mlp.up_proj": 15.040379524230957,
"model.layers.8.mlp.up_proj": 14.842131614685059,
"model.layers.19.mlp.up_proj": 13.117680549621582,
"model.layers.14.mlp.up_proj": 11.41967487335205,
"model.layers.20.mlp.up_proj": 11.295614242553711,
"model.layers.21.mlp.up_proj": 10.831307411193848,
"model.layers.23.mlp.up_proj": 9.982320785522461,
"model.layers.13.mlp.up_proj": 9.852916717529297,
"model.layers.24.mlp.up_proj": 7.668051719665527,
"model.layers.22.mlp.up_proj": 7.442222595214844,
"model.layers.25.mlp.up_proj": 4.745918273925781
},
"self_attn.k_proj": {
"model.layers.20.self_attn.k_proj": 1.2623848915100098,
"model.layers.21.self_attn.k_proj": 1.126978874206543,
"model.layers.2.self_attn.k_proj": 1.0654395818710327,
"model.layers.1.self_attn.k_proj": 1.0484901666641235,
"model.layers.3.self_attn.k_proj": 0.9912707805633545,
"model.layers.19.self_attn.k_proj": 0.9845684170722961,
"model.layers.18.self_attn.k_proj": 0.9728671312332153,
"model.layers.4.self_attn.k_proj": 0.9639020562171936,
"model.layers.6.self_attn.k_proj": 0.9274349808692932,
"model.layers.8.self_attn.k_proj": 0.9095296263694763,
"model.layers.15.self_attn.k_proj": 0.9011291265487671,
"model.layers.17.self_attn.k_proj": 0.9004068970680237,
"model.layers.23.self_attn.k_proj": 0.8472215533256531,
"model.layers.5.self_attn.k_proj": 0.8334033489227295,
"model.layers.12.self_attn.k_proj": 0.8052268028259277,
"model.layers.14.self_attn.k_proj": 0.7967967391014099,
"model.layers.24.self_attn.k_proj": 0.7792221903800964,
"model.layers.9.self_attn.k_proj": 0.7442198395729065,
"model.layers.22.self_attn.k_proj": 0.738936185836792,
"model.layers.16.self_attn.k_proj": 0.7356035113334656,
"model.layers.13.self_attn.k_proj": 0.7267259955406189,
"model.layers.7.self_attn.k_proj": 0.7121332883834839,
"model.layers.25.self_attn.k_proj": 0.7094318270683289,
"model.layers.10.self_attn.k_proj": 0.6790370345115662,
"model.layers.11.self_attn.k_proj": 0.6573328971862793,
"model.layers.0.self_attn.k_proj": 0.5670744776725769
},
"self_attn.o_proj": {
"model.layers.25.self_attn.o_proj": 0.3131503760814667,
"model.layers.6.self_attn.o_proj": 0.30267348885536194,
"model.layers.5.self_attn.o_proj": 0.29917699098587036,
"model.layers.4.self_attn.o_proj": 0.294284462928772,
"model.layers.1.self_attn.o_proj": 0.29038190841674805,
"model.layers.15.self_attn.o_proj": 0.279990553855896,
"model.layers.7.self_attn.o_proj": 0.2798372209072113,
"model.layers.3.self_attn.o_proj": 0.27829504013061523,
"model.layers.2.self_attn.o_proj": 0.27560076117515564,
"model.layers.12.self_attn.o_proj": 0.27154284715652466,
"model.layers.8.self_attn.o_proj": 0.25681808590888977,
"model.layers.11.self_attn.o_proj": 0.2539152503013611,
"model.layers.17.self_attn.o_proj": 0.2529059052467346,
"model.layers.0.self_attn.o_proj": 0.25265467166900635,
"model.layers.13.self_attn.o_proj": 0.25026363134384155,
"model.layers.22.self_attn.o_proj": 0.24831214547157288,
"model.layers.10.self_attn.o_proj": 0.24782003462314606,
"model.layers.14.self_attn.o_proj": 0.2316737025976181,
"model.layers.9.self_attn.o_proj": 0.2291463017463684,
"model.layers.16.self_attn.o_proj": 0.2279209941625595,
"model.layers.19.self_attn.o_proj": 0.2066410332918167,
"model.layers.23.self_attn.o_proj": 0.20168422162532806,
"model.layers.20.self_attn.o_proj": 0.20063552260398865,
"model.layers.21.self_attn.o_proj": 0.1952311396598816,
"model.layers.24.self_attn.o_proj": 0.18264922499656677,
"model.layers.18.self_attn.o_proj": 0.1780945062637329
},
"self_attn.q_proj": {
"model.layers.14.self_attn.q_proj": 0.5165186524391174,
"model.layers.6.self_attn.q_proj": 0.4943715035915375,
"model.layers.17.self_attn.q_proj": 0.47298240661621094,
"model.layers.16.self_attn.q_proj": 0.4636949300765991,
"model.layers.12.self_attn.q_proj": 0.4446524381637573,
"model.layers.10.self_attn.q_proj": 0.4427404999732971,
"model.layers.13.self_attn.q_proj": 0.4392520785331726,
"model.layers.15.self_attn.q_proj": 0.42862948775291443,
"model.layers.7.self_attn.q_proj": 0.42357802391052246,
"model.layers.19.self_attn.q_proj": 0.4219931662082672,
"model.layers.11.self_attn.q_proj": 0.4105197787284851,
"model.layers.18.self_attn.q_proj": 0.40164801478385925,
"model.layers.21.self_attn.q_proj": 0.397067129611969,
"model.layers.4.self_attn.q_proj": 0.3742890954017639,
"model.layers.20.self_attn.q_proj": 0.36900317668914795,
"model.layers.2.self_attn.q_proj": 0.3575708866119385,
"model.layers.23.self_attn.q_proj": 0.3568076491355896,
"model.layers.22.self_attn.q_proj": 0.351676344871521,
"model.layers.9.self_attn.q_proj": 0.3485497236251831,
"model.layers.1.self_attn.q_proj": 0.3282804489135742,
"model.layers.5.self_attn.q_proj": 0.315373957157135,
"model.layers.24.self_attn.q_proj": 0.28249993920326233,
"model.layers.3.self_attn.q_proj": 0.28181594610214233,
"model.layers.8.self_attn.q_proj": 0.26795536279678345,
"model.layers.0.self_attn.q_proj": 0.20543718338012695,
"model.layers.25.self_attn.q_proj": 0.19488219916820526
},
"self_attn.v_proj": {
"model.layers.18.self_attn.v_proj": 8.96899127960205,
"model.layers.19.self_attn.v_proj": 5.689997673034668,
"model.layers.4.self_attn.v_proj": 5.57612419128418,
"model.layers.25.self_attn.v_proj": 5.519944190979004,
"model.layers.21.self_attn.v_proj": 4.606760025024414,
"model.layers.15.self_attn.v_proj": 4.523311614990234,
"model.layers.7.self_attn.v_proj": 4.476346015930176,
"model.layers.3.self_attn.v_proj": 4.074836254119873,
"model.layers.17.self_attn.v_proj": 4.035794734954834,
"model.layers.2.self_attn.v_proj": 3.826523780822754,
"model.layers.24.self_attn.v_proj": 3.7527880668640137,
"model.layers.20.self_attn.v_proj": 3.703176498413086,
"model.layers.14.self_attn.v_proj": 3.437045097351074,
"model.layers.5.self_attn.v_proj": 2.7114996910095215,
"model.layers.23.self_attn.v_proj": 2.575815200805664,
"model.layers.1.self_attn.v_proj": 2.421088218688965,
"model.layers.13.self_attn.v_proj": 2.371032476425171,
"model.layers.11.self_attn.v_proj": 2.1319024562835693,
"model.layers.8.self_attn.v_proj": 1.7037322521209717,
"model.layers.9.self_attn.v_proj": 1.6977472305297852,
"model.layers.16.self_attn.v_proj": 1.5405595302581787,
"model.layers.12.self_attn.v_proj": 1.520254135131836,
"model.layers.6.self_attn.v_proj": 1.4515656232833862,
"model.layers.10.self_attn.v_proj": 1.4224656820297241,
"model.layers.0.self_attn.v_proj": 1.3283824920654297,
"model.layers.22.self_attn.v_proj": 0.9253509640693665
},
"mlp.gate_proj": {
"model.layers.1.mlp.gate_proj": 22.19009780883789,
"model.layers.2.mlp.gate_proj": 21.98990249633789,
"model.layers.0.mlp.gate_proj": 17.114286422729492,
"model.layers.3.mlp.gate_proj": 16.797019958496094,
"model.layers.4.mlp.gate_proj": 11.603490829467773,
"model.layers.6.mlp.gate_proj": 6.690526008605957,
"model.layers.5.mlp.gate_proj": 6.205199241638184,
"model.layers.24.mlp.gate_proj": 4.2970757484436035,
"model.layers.21.mlp.gate_proj": 4.259458541870117,
"model.layers.23.mlp.gate_proj": 4.240945816040039,
"model.layers.20.mlp.gate_proj": 4.202367782592773,
"model.layers.12.mlp.gate_proj": 4.017270565032959,
"model.layers.25.mlp.gate_proj": 3.916248321533203,
"model.layers.10.mlp.gate_proj": 3.850186586380005,
"model.layers.19.mlp.gate_proj": 3.7126221656799316,
"model.layers.17.mlp.gate_proj": 3.680795431137085,
"model.layers.15.mlp.gate_proj": 3.6055760383605957,
"model.layers.22.mlp.gate_proj": 3.5673747062683105,
"model.layers.18.mlp.gate_proj": 3.4207923412323,
"model.layers.13.mlp.gate_proj": 3.4158849716186523,
"model.layers.14.mlp.gate_proj": 3.331536054611206,
"model.layers.9.mlp.gate_proj": 3.2925198078155518,
"model.layers.11.mlp.gate_proj": 3.2574970722198486,
"model.layers.16.mlp.gate_proj": 3.216805934906006,
"model.layers.7.mlp.gate_proj": 3.2015552520751953,
"model.layers.8.mlp.gate_proj": 2.326204299926758
},
"input_layernorm": {
"model.layers.0.input_layernorm": Infinity,
"model.layers.1.input_layernorm": Infinity,
"model.layers.2.input_layernorm": Infinity,
"model.layers.3.input_layernorm": Infinity,
"model.layers.4.input_layernorm": Infinity,
"model.layers.5.input_layernorm": Infinity,
"model.layers.6.input_layernorm": Infinity,
"model.layers.7.input_layernorm": Infinity,
"model.layers.8.input_layernorm": Infinity,
"model.layers.9.input_layernorm": Infinity,
"model.layers.10.input_layernorm": Infinity,
"model.layers.11.input_layernorm": Infinity,
"model.layers.12.input_layernorm": Infinity,
"model.layers.13.input_layernorm": Infinity,
"model.layers.14.input_layernorm": Infinity,
"model.layers.15.input_layernorm": Infinity,
"model.layers.16.input_layernorm": Infinity,
"model.layers.17.input_layernorm": Infinity,
"model.layers.18.input_layernorm": Infinity,
"model.layers.19.input_layernorm": Infinity,
"model.layers.20.input_layernorm": Infinity,
"model.layers.21.input_layernorm": Infinity,
"model.layers.22.input_layernorm": Infinity,
"model.layers.23.input_layernorm": Infinity,
"model.layers.24.input_layernorm": Infinity,
"model.layers.25.input_layernorm": Infinity
},
"lm_head": {
"lm_head": 3.2275562286376953
},
"model.embed_tokens": {
"model.embed_tokens": 3.2275562286376953
},
"model.norm": {
"model.norm": Infinity
},
"post_attention_layernorm": {
"model.layers.0.post_attention_layernorm": Infinity,
"model.layers.1.post_attention_layernorm": Infinity,
"model.layers.2.post_attention_layernorm": Infinity,
"model.layers.3.post_attention_layernorm": Infinity,
"model.layers.4.post_attention_layernorm": Infinity,
"model.layers.5.post_attention_layernorm": Infinity,
"model.layers.6.post_attention_layernorm": Infinity,
"model.layers.7.post_attention_layernorm": Infinity,
"model.layers.8.post_attention_layernorm": Infinity,
"model.layers.9.post_attention_layernorm": Infinity,
"model.layers.10.post_attention_layernorm": Infinity,
"model.layers.11.post_attention_layernorm": Infinity,
"model.layers.12.post_attention_layernorm": Infinity,
"model.layers.13.post_attention_layernorm": Infinity,
"model.layers.14.post_attention_layernorm": Infinity,
"model.layers.15.post_attention_layernorm": Infinity,
"model.layers.16.post_attention_layernorm": Infinity,
"model.layers.17.post_attention_layernorm": Infinity,
"model.layers.18.post_attention_layernorm": Infinity,
"model.layers.19.post_attention_layernorm": Infinity,
"model.layers.20.post_attention_layernorm": Infinity,
"model.layers.21.post_attention_layernorm": Infinity,
"model.layers.22.post_attention_layernorm": Infinity,
"model.layers.23.post_attention_layernorm": Infinity,
"model.layers.24.post_attention_layernorm": Infinity,
"model.layers.25.post_attention_layernorm": Infinity
},
"post_feedforward_layernorm": {
"model.layers.0.post_feedforward_layernorm": Infinity,
"model.layers.1.post_feedforward_layernorm": Infinity,
"model.layers.2.post_feedforward_layernorm": Infinity,
"model.layers.3.post_feedforward_layernorm": Infinity,
"model.layers.4.post_feedforward_layernorm": Infinity,
"model.layers.5.post_feedforward_layernorm": Infinity,
"model.layers.6.post_feedforward_layernorm": Infinity,
"model.layers.7.post_feedforward_layernorm": Infinity,
"model.layers.8.post_feedforward_layernorm": Infinity,
"model.layers.9.post_feedforward_layernorm": Infinity,
"model.layers.10.post_feedforward_layernorm": Infinity,
"model.layers.11.post_feedforward_layernorm": Infinity,
"model.layers.12.post_feedforward_layernorm": Infinity,
"model.layers.13.post_feedforward_layernorm": Infinity,
"model.layers.14.post_feedforward_layernorm": Infinity,
"model.layers.15.post_feedforward_layernorm": Infinity,
"model.layers.16.post_feedforward_layernorm": Infinity,
"model.layers.17.post_feedforward_layernorm": Infinity,
"model.layers.18.post_feedforward_layernorm": Infinity,
"model.layers.19.post_feedforward_layernorm": Infinity,
"model.layers.20.post_feedforward_layernorm": Infinity,
"model.layers.21.post_feedforward_layernorm": Infinity,
"model.layers.22.post_feedforward_layernorm": Infinity,
"model.layers.23.post_feedforward_layernorm": Infinity,
"model.layers.24.post_feedforward_layernorm": Infinity,
"model.layers.25.post_feedforward_layernorm": Infinity
},
"pre_feedforward_layernorm": {
"model.layers.0.pre_feedforward_layernorm": Infinity,
"model.layers.1.pre_feedforward_layernorm": Infinity,
"model.layers.2.pre_feedforward_layernorm": Infinity,
"model.layers.3.pre_feedforward_layernorm": Infinity,
"model.layers.4.pre_feedforward_layernorm": Infinity,
"model.layers.5.pre_feedforward_layernorm": Infinity,
"model.layers.6.pre_feedforward_layernorm": Infinity,
"model.layers.7.pre_feedforward_layernorm": Infinity,
"model.layers.8.pre_feedforward_layernorm": Infinity,
"model.layers.9.pre_feedforward_layernorm": Infinity,
"model.layers.10.pre_feedforward_layernorm": Infinity,
"model.layers.11.pre_feedforward_layernorm": Infinity,
"model.layers.12.pre_feedforward_layernorm": Infinity,
"model.layers.13.pre_feedforward_layernorm": Infinity,
"model.layers.14.pre_feedforward_layernorm": Infinity,
"model.layers.15.pre_feedforward_layernorm": Infinity,
"model.layers.16.pre_feedforward_layernorm": Infinity,
"model.layers.17.pre_feedforward_layernorm": Infinity,
"model.layers.18.pre_feedforward_layernorm": Infinity,
"model.layers.19.pre_feedforward_layernorm": Infinity,
"model.layers.20.pre_feedforward_layernorm": Infinity,
"model.layers.21.pre_feedforward_layernorm": Infinity,
"model.layers.22.pre_feedforward_layernorm": Infinity,
"model.layers.23.pre_feedforward_layernorm": Infinity,
"model.layers.24.pre_feedforward_layernorm": Infinity,
"model.layers.25.pre_feedforward_layernorm": Infinity
}

Loading