| layer,module,loss,samples,damp,time | |
| 0,self_attn.k_proj,0.0000000002,0.05000,1.974 | |
| 0,self_attn.v_proj,0.0000000000,0.05000,1.669 | |
| 0,self_attn.q_proj,0.0000000012,0.05000,1.729 | |
| 0,self_attn.o_proj,0.0000000000,0.05000,1.706 | |
| 0,mlp.gate_proj,0.0000000007,0.05000,1.914 | |
| 0,mlp.up_proj,0.0000000007,0.05000,1.880 | |
| 0,mlp.down_proj,0.0000000000,0.05000,10.259 | |
| 1,self_attn.k_proj,0.0000000001,0.05000,1.658 | |
| 1,self_attn.v_proj,0.0000000000,0.05000,1.652 | |
| 1,self_attn.q_proj,0.0000000005,0.05000,1.732 | |
| 1,self_attn.o_proj,0.0000000000,0.05000,1.723 | |
| 1,mlp.gate_proj,0.0000000023,0.05000,1.906 | |
| 1,mlp.up_proj,0.0000000021,0.05000,1.898 | |
| 1,mlp.down_proj,0.0000008961,0.05000,10.304 | |
| 2,self_attn.k_proj,0.0000000072,0.05000,1.720 | |
| 2,self_attn.v_proj,0.0000000027,0.05000,1.684 | |
| 2,self_attn.q_proj,0.0000000268,0.05000,2.013 | |
| 2,self_attn.o_proj,0.0000000000,0.05000,1.745 | |
| 2,mlp.gate_proj,0.0000000038,0.05000,1.935 | |
| 2,mlp.up_proj,0.0000000036,0.05000,1.910 | |
| 2,mlp.down_proj,0.0000000001,0.05000,10.370 | |
| 3,self_attn.k_proj,0.0000000051,0.05000,1.693 | |
| 3,self_attn.v_proj,0.0000000022,0.05000,1.675 | |
| 3,self_attn.q_proj,0.0000000180,0.05000,1.742 | |
| 3,self_attn.o_proj,0.0000000001,0.05000,1.779 | |
| 3,mlp.gate_proj,0.0000000063,0.05000,1.927 | |
| 3,mlp.up_proj,0.0000000062,0.05000,1.915 | |
| 3,mlp.down_proj,0.0000000001,0.05000,10.372 | |
| 4,self_attn.k_proj,0.0000000074,0.05000,1.671 | |
| 4,self_attn.v_proj,0.0000000038,0.05000,1.646 | |
| 4,self_attn.q_proj,0.0000000315,0.05000,1.723 | |
| 4,self_attn.o_proj,0.0000000000,0.05000,1.728 | |
| 4,mlp.gate_proj,0.0000000122,0.05000,1.911 | |
| 4,mlp.up_proj,0.0000000119,0.05000,1.907 | |
| 4,mlp.down_proj,0.0000000002,0.05000,10.358 | |
| 5,self_attn.k_proj,0.0000000103,0.05000,1.671 | |
| 5,self_attn.v_proj,0.0000000059,0.05000,1.673 | |
| 5,self_attn.q_proj,0.0000000424,0.05000,1.719 | |
| 5,self_attn.o_proj,0.0000000000,0.05000,1.733 | |
| 5,mlp.gate_proj,0.0000000204,0.05000,1.899 | |
| 5,mlp.up_proj,0.0000000196,0.05000,1.896 | |
| 5,mlp.down_proj,0.0000000005,0.05000,10.346 | |
| 6,self_attn.k_proj,0.0000000069,0.05000,1.679 | |
| 6,self_attn.v_proj,0.0000000038,0.05000,1.696 | |
| 6,self_attn.q_proj,0.0000000270,0.05000,1.797 | |
| 6,self_attn.o_proj,0.0000000000,0.05000,1.755 | |
| 6,mlp.gate_proj,0.0000000274,0.05000,1.951 | |
| 6,mlp.up_proj,0.0000000263,0.05000,1.917 | |
| 6,mlp.down_proj,0.0000000007,0.05000,10.348 | |
| 7,self_attn.k_proj,0.0000000097,0.05000,1.676 | |
| 7,self_attn.v_proj,0.0000000049,0.05000,1.670 | |
| 7,self_attn.q_proj,0.0000000391,0.05000,1.870 | |
| 7,self_attn.o_proj,0.0000000001,0.05000,1.739 | |
| 7,mlp.gate_proj,0.0000000347,0.05000,2.106 | |
| 7,mlp.up_proj,0.0000000336,0.05000,1.917 | |
| 7,mlp.down_proj,0.0000000008,0.05000,10.379 | |
| 8,self_attn.k_proj,0.0000000091,0.05000,1.696 | |
| 8,self_attn.v_proj,0.0000000049,0.05000,1.691 | |
| 8,self_attn.q_proj,0.0000000357,0.05000,1.749 | |
| 8,self_attn.o_proj,0.0000000003,0.05000,1.743 | |
| 8,mlp.gate_proj,0.0000000405,0.05000,1.952 | |
| 8,mlp.up_proj,0.0000000386,0.05000,1.928 | |
| 8,mlp.down_proj,0.0000000011,0.05000,10.429 | |
| 9,self_attn.k_proj,0.0000000248,0.05000,1.686 | |
| 9,self_attn.v_proj,0.0000000147,0.05000,1.678 | |
| 9,self_attn.q_proj,0.0000001123,0.05000,1.757 | |
| 9,self_attn.o_proj,0.0000000005,0.05000,1.750 | |
| 9,mlp.gate_proj,0.0000000437,0.05000,1.930 | |
| 9,mlp.up_proj,0.0000000421,0.05000,1.922 | |
| 9,mlp.down_proj,0.0000000012,0.05000,10.380 | |
| 10,self_attn.k_proj,0.0000000149,0.05000,1.832 | |
| 10,self_attn.v_proj,0.0000000078,0.05000,1.673 | |
| 10,self_attn.q_proj,0.0000000632,0.05000,1.762 | |
| 10,self_attn.o_proj,0.0000000006,0.05000,1.745 | |
| 10,mlp.gate_proj,0.0000000530,0.05000,1.930 | |
| 10,mlp.up_proj,0.0000000508,0.05000,1.924 | |
| 10,mlp.down_proj,0.0000000016,0.05000,10.373 | |
| 11,self_attn.k_proj,0.0000000174,0.05000,1.683 | |
| 11,self_attn.v_proj,0.0000000082,0.05000,1.680 | |
| 11,self_attn.q_proj,0.0000000763,0.05000,1.740 | |
| 11,self_attn.o_proj,0.0000000007,0.05000,1.737 | |
| 11,mlp.gate_proj,0.0000000608,0.05000,1.929 | |
| 11,mlp.up_proj,0.0000000578,0.05000,1.922 | |
| 11,mlp.down_proj,0.0000000021,0.05000,10.403 | |
| 12,self_attn.k_proj,0.0000000232,0.05000,1.685 | |
| 12,self_attn.v_proj,0.0000000127,0.05000,1.680 | |
| 12,self_attn.q_proj,0.0000001077,0.05000,1.734 | |
| 12,self_attn.o_proj,0.0000000010,0.05000,1.739 | |
| 12,mlp.gate_proj,0.0000000679,0.05000,1.916 | |
| 12,mlp.up_proj,0.0000000650,0.05000,1.903 | |
| 12,mlp.down_proj,0.0000000024,0.05000,10.544 | |
| 13,self_attn.k_proj,0.0000000216,0.05000,1.725 | |
| 13,self_attn.v_proj,0.0000000119,0.05000,1.682 | |
| 13,self_attn.q_proj,0.0000000984,0.05000,1.740 | |
| 13,self_attn.o_proj,0.0000000008,0.05000,1.740 | |
| 13,mlp.gate_proj,0.0000000776,0.05000,1.928 | |
| 13,mlp.up_proj,0.0000000744,0.05000,1.916 | |
| 13,mlp.down_proj,0.0000000031,0.05000,10.419 | |
| 14,self_attn.k_proj,0.0000000208,0.05000,1.681 | |
| 14,self_attn.v_proj,0.0000000114,0.05000,1.667 | |
| 14,self_attn.q_proj,0.0000000948,0.05000,1.726 | |
| 14,self_attn.o_proj,0.0000000014,0.05000,1.732 | |
| 14,mlp.gate_proj,0.0000000797,0.05000,1.936 | |
| 14,mlp.up_proj,0.0000000766,0.05000,1.910 | |
| 14,mlp.down_proj,0.0000000034,0.05000,10.375 | |
| 15,self_attn.k_proj,0.0000000260,0.05000,1.708 | |
| 15,self_attn.v_proj,0.0000000144,0.05000,1.686 | |
| 15,self_attn.q_proj,0.0000001285,0.05000,1.740 | |
| 15,self_attn.o_proj,0.0000000011,0.05000,1.739 | |
| 15,mlp.gate_proj,0.0000001000,0.05000,1.947 | |
| 15,mlp.up_proj,0.0000000956,0.05000,1.984 | |
| 15,mlp.down_proj,0.0000000041,0.05000,10.378 | |
| 16,self_attn.k_proj,0.0000000244,0.05000,1.702 | |
| 16,self_attn.v_proj,0.0000000126,0.05000,1.695 | |
| 16,self_attn.q_proj,0.0000001144,0.05000,1.765 | |
| 16,self_attn.o_proj,0.0000000013,0.05000,1.739 | |
| 16,mlp.gate_proj,0.0000001086,0.05000,1.921 | |
| 16,mlp.up_proj,0.0000001038,0.05000,1.909 | |
| 16,mlp.down_proj,0.0000000048,0.05000,10.561 | |
| 17,self_attn.k_proj,0.0000000198,0.05000,1.673 | |
| 17,self_attn.v_proj,0.0000000121,0.05000,1.671 | |
| 17,self_attn.q_proj,0.0000000910,0.05000,1.734 | |
| 17,self_attn.o_proj,0.0000000017,0.05000,1.725 | |
| 17,mlp.gate_proj,0.0000001043,0.05000,1.907 | |
| 17,mlp.up_proj,0.0000001004,0.05000,1.907 | |
| 17,mlp.down_proj,0.0000000052,0.05000,10.344 | |
| 18,self_attn.k_proj,0.0000000385,0.05000,2.049 | |
| 18,self_attn.v_proj,0.0000000218,0.05000,1.699 | |
| 18,self_attn.q_proj,0.0000001757,0.05000,1.776 | |
| 18,self_attn.o_proj,0.0000000015,0.05000,1.755 | |
| 18,mlp.gate_proj,0.0000001256,0.05000,1.967 | |
| 18,mlp.up_proj,0.0000001200,0.05000,1.908 | |
| 18,mlp.down_proj,0.0000000065,0.05000,10.347 | |
| 19,self_attn.k_proj,0.0000000501,0.05000,1.685 | |
| 19,self_attn.v_proj,0.0000000309,0.05000,1.691 | |
| 19,self_attn.q_proj,0.0000002407,0.05000,1.745 | |
| 19,self_attn.o_proj,0.0000000016,0.05000,1.737 | |
| 19,mlp.gate_proj,0.0000001447,0.05000,2.317 | |
| 19,mlp.up_proj,0.0000001387,0.05000,1.923 | |
| 19,mlp.down_proj,0.0000000093,0.05000,10.378 | |
| 20,self_attn.k_proj,0.0000000189,0.05000,1.693 | |
| 20,self_attn.v_proj,0.0000000115,0.05000,1.674 | |
| 20,self_attn.q_proj,0.0000000936,0.05000,2.097 | |
| 20,self_attn.o_proj,0.0000000022,0.05000,1.745 | |
| 20,mlp.gate_proj,0.0000001753,0.05000,1.931 | |
| 20,mlp.up_proj,0.0000001662,0.05000,1.917 | |
| 20,mlp.down_proj,0.0000000123,0.05000,10.487 | |
| 21,self_attn.k_proj,0.0000000155,0.05000,1.669 | |
| 21,self_attn.v_proj,0.0000000104,0.05000,1.688 | |
| 21,self_attn.q_proj,0.0000000778,0.05000,1.737 | |
| 21,self_attn.o_proj,0.0000000039,0.05000,1.738 | |
| 21,mlp.gate_proj,0.0000001586,0.05000,1.919 | |
| 21,mlp.up_proj,0.0000001516,0.05000,1.907 | |
| 21,mlp.down_proj,0.0000000121,0.05000,10.398 | |
| 22,self_attn.k_proj,0.0000000406,0.05000,1.930 | |
| 22,self_attn.v_proj,0.0000000258,0.05000,1.795 | |
| 22,self_attn.q_proj,0.0000002221,0.05000,1.847 | |
| 22,self_attn.o_proj,0.0000000047,0.05000,1.845 | |
| 22,mlp.gate_proj,0.0000002180,0.05000,1.908 | |
| 22,mlp.up_proj,0.0000002092,0.05000,1.899 | |
| 22,mlp.down_proj,0.0000000232,0.05000,10.346 | |
| 23,self_attn.k_proj,0.0000000330,0.05000,1.688 | |
| 23,self_attn.v_proj,0.0000000227,0.05000,1.694 | |
| 23,self_attn.q_proj,0.0000001895,0.05000,1.735 | |
| 23,self_attn.o_proj,0.0000000058,0.05000,1.731 | |
| 23,mlp.gate_proj,0.0000002436,0.05000,2.232 | |
| 23,mlp.up_proj,0.0000002310,0.05000,1.919 | |
| 23,mlp.down_proj,0.0000000223,0.05000,10.404 | |
| 24,self_attn.k_proj,0.0000000284,0.05000,1.704 | |
| 24,self_attn.v_proj,0.0000000233,0.05000,1.677 | |
| 24,self_attn.q_proj,0.0000001599,0.05000,1.756 | |
| 24,self_attn.o_proj,0.0000000056,0.05000,1.740 | |
| 24,mlp.gate_proj,0.0000002843,0.05000,1.914 | |
| 24,mlp.up_proj,0.0000002675,0.05000,1.923 | |
| 24,mlp.down_proj,0.0000000246,0.05000,10.306 | |
| 25,self_attn.k_proj,0.0000000507,0.05000,1.685 | |
| 25,self_attn.v_proj,0.0000000330,0.05000,1.658 | |
| 25,self_attn.q_proj,0.0000002889,0.05000,1.731 | |
| 25,self_attn.o_proj,0.0000000067,0.05000,1.731 | |
| 25,mlp.gate_proj,0.0000003367,0.05000,1.912 | |
| 25,mlp.up_proj,0.0000003191,0.05000,1.902 | |
| 25,mlp.down_proj,0.0000000288,0.05000,10.478 | |
| 26,self_attn.k_proj,0.0000000367,0.05000,1.930 | |
| 26,self_attn.v_proj,0.0000000248,0.05000,1.656 | |
| 26,self_attn.q_proj,0.0000002028,0.05000,1.726 | |
| 26,self_attn.o_proj,0.0000000083,0.05000,1.722 | |
| 26,mlp.gate_proj,0.0000003796,0.05000,1.905 | |
| 26,mlp.up_proj,0.0000003608,0.05000,1.904 | |
| 26,mlp.down_proj,0.0000000304,0.05000,10.362 | |
| 27,self_attn.k_proj,0.0000000365,0.05000,1.719 | |
| 27,self_attn.v_proj,0.0000000260,0.05000,1.680 | |
| 27,self_attn.q_proj,0.0000001969,0.05000,1.739 | |
| 27,self_attn.o_proj,0.0000000069,0.05000,1.726 | |
| 27,mlp.gate_proj,0.0000004164,0.05000,1.978 | |
| 27,mlp.up_proj,0.0000003971,0.05000,1.906 | |
| 27,mlp.down_proj,0.0000000330,0.05000,10.315 | |
| 28,self_attn.k_proj,0.0000000359,0.05000,1.672 | |
| 28,self_attn.v_proj,0.0000000281,0.05000,1.661 | |
| 28,self_attn.q_proj,0.0000002018,0.05000,1.720 | |
| 28,self_attn.o_proj,0.0000000056,0.05000,1.825 | |
| 28,mlp.gate_proj,0.0000004448,0.05000,1.915 | |
| 28,mlp.up_proj,0.0000004269,0.05000,1.922 | |
| 28,mlp.down_proj,0.0000000380,0.05000,10.441 | |
| 29,self_attn.k_proj,0.0000000469,0.05000,1.686 | |
| 29,self_attn.v_proj,0.0000000308,0.05000,1.671 | |
| 29,self_attn.q_proj,0.0000002493,0.05000,1.732 | |
| 29,self_attn.o_proj,0.0000000091,0.05000,1.749 | |
| 29,mlp.gate_proj,0.0000004729,0.05000,1.929 | |
| 29,mlp.up_proj,0.0000004529,0.05000,1.907 | |
| 29,mlp.down_proj,0.0000000403,0.05000,10.360 | |
| 30,self_attn.k_proj,0.0000000461,0.05000,1.996 | |
| 30,self_attn.v_proj,0.0000000365,0.05000,1.671 | |
| 30,self_attn.q_proj,0.0000002671,0.05000,1.728 | |
| 30,self_attn.o_proj,0.0000000104,0.05000,1.738 | |
| 30,mlp.gate_proj,0.0000005154,0.05000,1.914 | |
| 30,mlp.up_proj,0.0000004883,0.05000,1.904 | |
| 30,mlp.down_proj,0.0000000424,0.05000,10.348 | |
| 31,self_attn.k_proj,0.0000000515,0.05000,1.688 | |
| 31,self_attn.v_proj,0.0000000394,0.05000,1.672 | |
| 31,self_attn.q_proj,0.0000002855,0.05000,1.712 | |
| 31,self_attn.o_proj,0.0000000071,0.05000,1.710 | |
| 31,mlp.gate_proj,0.0000005588,0.05000,1.907 | |
| 31,mlp.up_proj,0.0000005285,0.05000,1.895 | |
| 31,mlp.down_proj,0.0000000449,0.05000,10.287 | |
| 32,self_attn.k_proj,0.0000000566,0.05000,1.686 | |
| 32,self_attn.v_proj,0.0000000439,0.05000,1.661 | |
| 32,self_attn.q_proj,0.0000003142,0.05000,1.719 | |
| 32,self_attn.o_proj,0.0000000082,0.05000,1.721 | |
| 32,mlp.gate_proj,0.0000005844,0.05000,1.927 | |
| 32,mlp.up_proj,0.0000005537,0.05000,1.907 | |
| 32,mlp.down_proj,0.0000000477,0.05000,10.363 | |
| 33,self_attn.k_proj,0.0000000530,0.05000,1.695 | |
| 33,self_attn.v_proj,0.0000000485,0.05000,1.689 | |
| 33,self_attn.q_proj,0.0000002834,0.05000,1.735 | |
| 33,self_attn.o_proj,0.0000000060,0.05000,1.739 | |
| 33,mlp.gate_proj,0.0000006227,0.05000,1.919 | |
| 33,mlp.up_proj,0.0000005820,0.05000,1.914 | |
| 33,mlp.down_proj,0.0000000490,0.05000,10.298 | |
| 34,self_attn.k_proj,0.0000000596,0.05000,1.676 | |
| 34,self_attn.v_proj,0.0000000547,0.05000,1.676 | |
| 34,self_attn.q_proj,0.0000003310,0.05000,1.717 | |
| 34,self_attn.o_proj,0.0000000044,0.05000,1.729 | |
| 34,mlp.gate_proj,0.0000006503,0.05000,1.912 | |
| 34,mlp.up_proj,0.0000006064,0.05000,1.900 | |
| 34,mlp.down_proj,0.0000000523,0.05000,10.422 | |
| 35,self_attn.k_proj,0.0000000653,0.05000,1.674 | |
| 35,self_attn.v_proj,0.0000000614,0.05000,1.683 | |
| 35,self_attn.q_proj,0.0000003620,0.05000,2.377 | |
| 35,self_attn.o_proj,0.0000000036,0.05000,1.718 | |
| 35,mlp.gate_proj,0.0000006651,0.05000,1.926 | |
| 35,mlp.up_proj,0.0000006244,0.05000,1.910 | |
| 35,mlp.down_proj,0.0000000536,0.05000,10.552 | |
| 36,self_attn.k_proj,0.0000000689,0.05000,1.658 | |
| 36,self_attn.v_proj,0.0000000649,0.05000,1.657 | |
| 36,self_attn.q_proj,0.0000003802,0.05000,1.706 | |
| 36,self_attn.o_proj,0.0000000064,0.05000,1.718 | |
| 36,mlp.gate_proj,0.0000006757,0.05000,1.931 | |
| 36,mlp.up_proj,0.0000006380,0.05000,1.894 | |
| 36,mlp.down_proj,0.0000000534,0.05000,10.309 | |
| 37,self_attn.k_proj,0.0000000654,0.05000,1.668 | |
| 37,self_attn.v_proj,0.0000000588,0.05000,1.662 | |
| 37,self_attn.q_proj,0.0000003550,0.05000,1.710 | |
| 37,self_attn.o_proj,0.0000000057,0.05000,1.733 | |
| 37,mlp.gate_proj,0.0000006918,0.05000,2.328 | |
| 37,mlp.up_proj,0.0000006588,0.05000,1.934 | |
| 37,mlp.down_proj,0.0000000565,0.05000,10.372 | |
| 38,self_attn.k_proj,0.0000000652,0.05000,1.686 | |
| 38,self_attn.v_proj,0.0000000540,0.05000,1.697 | |
| 38,self_attn.q_proj,0.0000003431,0.05000,1.736 | |
| 38,self_attn.o_proj,0.0000000096,0.05000,1.741 | |
| 38,mlp.gate_proj,0.0000007154,0.05000,1.921 | |
| 38,mlp.up_proj,0.0000006809,0.05000,1.929 | |
| 38,mlp.down_proj,0.0000000597,0.05000,10.366 | |
| 39,self_attn.k_proj,0.0000000628,0.05000,1.715 | |
| 39,self_attn.v_proj,0.0000000543,0.05000,1.686 | |
| 39,self_attn.q_proj,0.0000003293,0.05000,1.742 | |
| 39,self_attn.o_proj,0.0000000088,0.05000,1.726 | |
| 39,mlp.gate_proj,0.0000007348,0.05000,1.888 | |
| 39,mlp.up_proj,0.0000007033,0.05000,1.889 | |
| 39,mlp.down_proj,0.0000000644,0.05000,10.275 | |
| 40,self_attn.k_proj,0.0000000626,0.05000,1.658 | |
| 40,self_attn.v_proj,0.0000000444,0.05000,1.652 | |
| 40,self_attn.q_proj,0.0000003235,0.05000,1.708 | |
| 40,self_attn.o_proj,0.0000000141,0.05000,1.716 | |
| 40,mlp.gate_proj,0.0000007610,0.05000,1.901 | |
| 40,mlp.up_proj,0.0000007342,0.05000,1.908 | |
| 40,mlp.down_proj,0.0000000727,0.05000,10.326 | |
| 41,self_attn.k_proj,0.0000000559,0.05000,1.666 | |
| 41,self_attn.v_proj,0.0000000421,0.05000,1.662 | |
| 41,self_attn.q_proj,0.0000002855,0.05000,1.738 | |
| 41,self_attn.o_proj,0.0000000170,0.05000,1.719 | |
| 41,mlp.gate_proj,0.0000008057,0.05000,1.895 | |
| 41,mlp.up_proj,0.0000007766,0.05000,1.907 | |
| 41,mlp.down_proj,0.0000000785,0.05000,10.269 | |
| 42,self_attn.k_proj,0.0000000701,0.05000,1.682 | |
| 42,self_attn.v_proj,0.0000000549,0.05000,1.672 | |
| 42,self_attn.q_proj,0.0000003824,0.05000,1.732 | |
| 42,self_attn.o_proj,0.0000000133,0.05000,1.733 | |
| 42,mlp.gate_proj,0.0000008403,0.05000,1.912 | |
| 42,mlp.up_proj,0.0000008162,0.05000,1.909 | |
| 42,mlp.down_proj,0.0000000892,0.05000,10.328 | |
| 43,self_attn.k_proj,0.0000000691,0.05000,1.662 | |
| 43,self_attn.v_proj,0.0000000489,0.05000,1.658 | |
| 43,self_attn.q_proj,0.0000003654,0.05000,1.719 | |
| 43,self_attn.o_proj,0.0000000184,0.05000,1.724 | |
| 43,mlp.gate_proj,0.0000008706,0.05000,1.906 | |
| 43,mlp.up_proj,0.0000008532,0.05000,1.898 | |
| 43,mlp.down_proj,0.0000000997,0.05000,10.280 | |
| 44,self_attn.k_proj,0.0000000654,0.05000,1.680 | |
| 44,self_attn.v_proj,0.0000000442,0.05000,1.681 | |
| 44,self_attn.q_proj,0.0000003623,0.05000,1.719 | |
| 44,self_attn.o_proj,0.0000000237,0.05000,1.722 | |
| 44,mlp.gate_proj,0.0000008908,0.05000,1.902 | |
| 44,mlp.up_proj,0.0000008894,0.05000,1.899 | |
| 44,mlp.down_proj,0.0000001206,0.05000,10.276 | |
| 45,self_attn.k_proj,0.0000000697,0.05000,1.685 | |
| 45,self_attn.v_proj,0.0000000401,0.05000,1.672 | |
| 45,self_attn.q_proj,0.0000003854,0.05000,1.723 | |
| 45,self_attn.o_proj,0.0000000327,0.05000,1.723 | |
| 45,mlp.gate_proj,0.0000009161,0.05000,1.901 | |
| 45,mlp.up_proj,0.0000009227,0.05000,1.897 | |
| 45,mlp.down_proj,0.0000002357,0.05000,10.295 | |
| 46,self_attn.k_proj,0.0000000762,0.05000,1.683 | |
| 46,self_attn.v_proj,0.0000000453,0.05000,1.669 | |
| 46,self_attn.q_proj,0.0000004139,0.05000,1.718 | |
| 46,self_attn.o_proj,0.0000000476,0.05000,1.726 | |
| 46,mlp.gate_proj,0.0000009351,0.05000,1.919 | |
| 46,mlp.up_proj,0.0000009498,0.05000,1.906 | |
| 46,mlp.down_proj,0.0000001348,0.05000,10.401 | |
| 47,self_attn.k_proj,0.0000000752,0.05000,1.771 | |
| 47,self_attn.v_proj,0.0000000472,0.05000,1.766 | |
| 47,self_attn.q_proj,0.0000004191,0.05000,1.832 | |
| 47,self_attn.o_proj,0.0000000484,0.05000,1.821 | |
| 47,mlp.gate_proj,0.0000009350,0.05000,2.010 | |
| 47,mlp.up_proj,0.0000009616,0.05000,1.989 | |
| 47,mlp.down_proj,0.0000001510,0.05000,10.687 | |
| 48,self_attn.k_proj,0.0000000725,0.05000,1.662 | |
| 48,self_attn.v_proj,0.0000000535,0.05000,1.678 | |
| 48,self_attn.q_proj,0.0000004339,0.05000,1.743 | |
| 48,self_attn.o_proj,0.0000000450,0.05000,1.716 | |
| 48,mlp.gate_proj,0.0000009859,0.05000,1.900 | |
| 48,mlp.up_proj,0.0000010179,0.05000,1.906 | |
| 48,mlp.down_proj,0.0000001680,0.05000,10.308 | |
| 49,self_attn.k_proj,0.0000000722,0.05000,1.781 | |
| 49,self_attn.v_proj,0.0000000513,0.05000,1.760 | |
| 49,self_attn.q_proj,0.0000004106,0.05000,1.806 | |
| 49,self_attn.o_proj,0.0000000500,0.05000,1.833 | |
| 49,mlp.gate_proj,0.0000009837,0.05000,2.007 | |
| 49,mlp.up_proj,0.0000010262,0.05000,2.003 | |
| 49,mlp.down_proj,0.0000001827,0.05000,10.479 | |
| 50,self_attn.k_proj,0.0000000878,0.05000,1.670 | |
| 50,self_attn.v_proj,0.0000000588,0.05000,1.668 | |
| 50,self_attn.q_proj,0.0000005187,0.05000,1.708 | |
| 50,self_attn.o_proj,0.0000000689,0.05000,1.719 | |
| 50,mlp.gate_proj,0.0000009710,0.05000,1.948 | |
| 50,mlp.up_proj,0.0000010223,0.05000,1.898 | |
| 50,mlp.down_proj,0.0000002030,0.05000,10.599 | |
| 51,self_attn.k_proj,0.0000000785,0.05000,1.850 | |
| 51,self_attn.v_proj,0.0000000516,0.05000,1.689 | |
| 51,self_attn.q_proj,0.0000004482,0.05000,1.730 | |
| 51,self_attn.o_proj,0.0000000717,0.05000,1.733 | |
| 51,mlp.gate_proj,0.0000010186,0.05000,1.912 | |
| 51,mlp.up_proj,0.0000010654,0.05000,1.934 | |
| 51,mlp.down_proj,0.0000002185,0.05000,10.323 | |
| 52,self_attn.k_proj,0.0000000687,0.05000,1.682 | |
| 52,self_attn.v_proj,0.0000000637,0.05000,1.651 | |
| 52,self_attn.q_proj,0.0000004243,0.05000,1.713 | |
| 52,self_attn.o_proj,0.0000000786,0.05000,1.719 | |
| 52,mlp.gate_proj,0.0000011731,0.05000,1.947 | |
| 52,mlp.up_proj,0.0000012116,0.05000,1.890 | |
| 52,mlp.down_proj,0.0000002340,0.05000,10.247 | |
| 53,self_attn.k_proj,0.0000000788,0.05000,1.659 | |
| 53,self_attn.v_proj,0.0000000687,0.05000,1.654 | |
| 53,self_attn.q_proj,0.0000004782,0.05000,1.724 | |
| 53,self_attn.o_proj,0.0000000906,0.05000,1.725 | |
| 53,mlp.gate_proj,0.0000012602,0.05000,1.901 | |
| 53,mlp.up_proj,0.0000012900,0.05000,1.897 | |
| 53,mlp.down_proj,0.0000002460,0.05000,10.405 | |
| 54,self_attn.k_proj,0.0000000766,0.05000,2.517 | |
| 54,self_attn.v_proj,0.0000000886,0.05000,1.708 | |
| 54,self_attn.q_proj,0.0000005082,0.05000,1.749 | |
| 54,self_attn.o_proj,0.0000000811,0.05000,1.728 | |
| 54,mlp.gate_proj,0.0000012372,0.05000,2.083 | |
| 54,mlp.up_proj,0.0000012735,0.05000,1.901 | |
| 54,mlp.down_proj,0.0000002715,0.05000,10.699 | |
| 55,self_attn.k_proj,0.0000000740,0.05000,1.671 | |
| 55,self_attn.v_proj,0.0000000864,0.05000,1.672 | |
| 55,self_attn.q_proj,0.0000004974,0.05000,1.727 | |
| 55,self_attn.o_proj,0.0000000965,0.05000,1.724 | |
| 55,mlp.gate_proj,0.0000012793,0.05000,1.915 | |
| 55,mlp.up_proj,0.0000013217,0.05000,1.901 | |
| 55,mlp.down_proj,0.0000003111,0.05000,10.333 | |
| 56,self_attn.k_proj,0.0000000757,0.05000,1.705 | |
| 56,self_attn.v_proj,0.0000000742,0.05000,1.662 | |
| 56,self_attn.q_proj,0.0000004671,0.05000,1.719 | |
| 56,self_attn.o_proj,0.0000001299,0.05000,1.707 | |
| 56,mlp.gate_proj,0.0000014066,0.05000,1.915 | |
| 56,mlp.up_proj,0.0000014399,0.05000,1.896 | |
| 56,mlp.down_proj,0.0000003492,0.05000,10.264 | |
| 57,self_attn.k_proj,0.0000000814,0.05000,1.686 | |
| 57,self_attn.v_proj,0.0000000867,0.05000,1.661 | |
| 57,self_attn.q_proj,0.0000005055,0.05000,1.717 | |
| 57,self_attn.o_proj,0.0000001356,0.05000,1.712 | |
| 57,mlp.gate_proj,0.0000013990,0.05000,1.895 | |
| 57,mlp.up_proj,0.0000014438,0.05000,1.891 | |
| 57,mlp.down_proj,0.0000003847,0.05000,10.443 | |
| 58,self_attn.k_proj,0.0000000745,0.05000,1.664 | |
| 58,self_attn.v_proj,0.0000000881,0.05000,1.659 | |
| 58,self_attn.q_proj,0.0000004971,0.05000,1.703 | |
| 58,self_attn.o_proj,0.0000001591,0.05000,1.705 | |
| 58,mlp.gate_proj,0.0000014434,0.05000,1.901 | |
| 58,mlp.up_proj,0.0000014912,0.05000,1.889 | |
| 58,mlp.down_proj,0.0000004838,0.05000,10.536 | |
| 59,self_attn.k_proj,0.0000000753,0.05000,1.677 | |
| 59,self_attn.v_proj,0.0000000926,0.05000,1.665 | |
| 59,self_attn.q_proj,0.0000004938,0.05000,1.722 | |
| 59,self_attn.o_proj,0.0000001720,0.05000,1.742 | |
| 59,mlp.gate_proj,0.0000015366,0.05000,1.903 | |
| 59,mlp.up_proj,0.0000015528,0.05000,1.898 | |
| 59,mlp.down_proj,0.0000005539,0.05000,10.287 | |
| 60,self_attn.k_proj,0.0000000820,0.05000,1.692 | |
| 60,self_attn.v_proj,0.0000001168,0.05000,1.689 | |
| 60,self_attn.q_proj,0.0000005763,0.05000,1.753 | |
| 60,self_attn.o_proj,0.0000001487,0.05000,1.720 | |
| 60,mlp.gate_proj,0.0000018750,0.05000,1.922 | |
| 60,mlp.up_proj,0.0000018547,0.05000,1.894 | |
| 60,mlp.down_proj,0.0000006279,0.05000,10.338 | |
| 61,self_attn.k_proj,0.0000000843,0.05000,1.682 | |
| 61,self_attn.v_proj,0.0000001284,0.05000,1.673 | |
| 61,self_attn.q_proj,0.0000005832,0.05000,1.728 | |
| 61,self_attn.o_proj,0.0000001704,0.05000,1.719 | |
| 61,mlp.gate_proj,0.0000020632,0.05000,1.944 | |
| 61,mlp.up_proj,0.0000020309,0.05000,1.923 | |
| 61,mlp.down_proj,0.0000007217,0.05000,10.248 | |
| 62,self_attn.k_proj,0.0000000880,0.05000,1.771 | |
| 62,self_attn.v_proj,0.0000001228,0.05000,1.671 | |
| 62,self_attn.q_proj,0.0000006076,0.05000,1.716 | |
| 62,self_attn.o_proj,0.0000001910,0.05000,1.713 | |
| 62,mlp.gate_proj,0.0000024024,0.05000,1.917 | |
| 62,mlp.up_proj,0.0000023178,0.05000,1.895 | |
| 62,mlp.down_proj,0.0000007976,0.05000,10.293 | |
| 63,self_attn.k_proj,0.0000000886,0.05000,1.658 | |
| 63,self_attn.v_proj,0.0000001268,0.05000,1.658 | |
| 63,self_attn.q_proj,0.0000005992,0.05000,1.713 | |
| 63,self_attn.o_proj,0.0000002006,0.05000,1.727 | |
| 63,mlp.gate_proj,0.0000025440,0.05000,1.906 | |
| 63,mlp.up_proj,0.0000024767,0.05000,1.891 | |
| 63,mlp.down_proj,0.0000009258,0.05000,10.266 | |
| 64,self_attn.k_proj,0.0000000947,0.05000,1.699 | |
| 64,self_attn.v_proj,0.0000001271,0.05000,1.666 | |
| 64,self_attn.q_proj,0.0000006335,0.05000,1.731 | |
| 64,self_attn.o_proj,0.0000001935,0.05000,1.729 | |
| 64,mlp.gate_proj,0.0000027792,0.05000,1.926 | |
| 64,mlp.up_proj,0.0000026894,0.05000,1.911 | |
| 64,mlp.down_proj,0.0000010580,0.05000,10.313 | |
| 65,self_attn.k_proj,0.0000000973,0.05000,1.673 | |
| 65,self_attn.v_proj,0.0000001354,0.05000,1.666 | |
| 65,self_attn.q_proj,0.0000006541,0.05000,1.719 | |
| 65,self_attn.o_proj,0.0000002121,0.05000,1.707 | |
| 65,mlp.gate_proj,0.0000030904,0.05000,1.900 | |
| 65,mlp.up_proj,0.0000029994,0.05000,1.912 | |
| 65,mlp.down_proj,0.0000011762,0.05000,10.271 | |
| 66,self_attn.k_proj,0.0000000857,0.05000,1.672 | |
| 66,self_attn.v_proj,0.0000001420,0.05000,1.662 | |
| 66,self_attn.q_proj,0.0000006095,0.05000,1.715 | |
| 66,self_attn.o_proj,0.0000002038,0.05000,1.736 | |
| 66,mlp.gate_proj,0.0000035893,0.05000,1.916 | |
| 66,mlp.up_proj,0.0000034360,0.05000,1.900 | |
| 66,mlp.down_proj,0.0000013113,0.05000,10.293 | |
| 67,self_attn.k_proj,0.0000000931,0.05000,1.689 | |
| 67,self_attn.v_proj,0.0000001635,0.05000,1.655 | |
| 67,self_attn.q_proj,0.0000006569,0.05000,1.704 | |
| 67,self_attn.o_proj,0.0000001514,0.05000,1.716 | |
| 67,mlp.gate_proj,0.0000037963,0.05000,1.903 | |
| 67,mlp.up_proj,0.0000036747,0.05000,1.892 | |
| 67,mlp.down_proj,0.0000014222,0.05000,10.266 | |
| 68,self_attn.k_proj,0.0000000962,0.05000,1.673 | |
| 68,self_attn.v_proj,0.0000001876,0.05000,1.658 | |
| 68,self_attn.q_proj,0.0000006989,0.05000,1.737 | |
| 68,self_attn.o_proj,0.0000001924,0.05000,1.712 | |
| 68,mlp.gate_proj,0.0000040879,0.05000,2.112 | |
| 68,mlp.up_proj,0.0000040017,0.05000,1.889 | |
| 68,mlp.down_proj,0.0000015691,0.05000,10.353 | |
| 69,self_attn.k_proj,0.0000000987,0.05000,1.666 | |
| 69,self_attn.v_proj,0.0000001590,0.05000,1.655 | |
| 69,self_attn.q_proj,0.0000006813,0.05000,1.701 | |
| 69,self_attn.o_proj,0.0000002237,0.05000,1.707 | |
| 69,mlp.gate_proj,0.0000043632,0.05000,1.902 | |
| 69,mlp.up_proj,0.0000043560,0.05000,1.890 | |
| 69,mlp.down_proj,0.0000019097,0.05000,10.358 | |
| 70,self_attn.k_proj,0.0000000952,0.05000,1.686 | |
| 70,self_attn.v_proj,0.0000002180,0.05000,1.663 | |
| 70,self_attn.q_proj,0.0000007084,0.05000,1.715 | |
| 70,self_attn.o_proj,0.0000002977,0.05000,1.720 | |
| 70,mlp.gate_proj,0.0000049191,0.05000,1.918 | |
| 70,mlp.up_proj,0.0000049845,0.05000,1.899 | |
| 70,mlp.down_proj,0.0000023394,0.05000,10.278 | |
| 71,self_attn.k_proj,0.0000001000,0.05000,1.660 | |
| 71,self_attn.v_proj,0.0000002286,0.05000,1.658 | |
| 71,self_attn.q_proj,0.0000007376,0.05000,1.733 | |
| 71,self_attn.o_proj,0.0000003390,0.05000,1.731 | |
| 71,mlp.gate_proj,0.0000053962,0.05000,2.021 | |
| 71,mlp.up_proj,0.0000055504,0.05000,1.898 | |
| 71,mlp.down_proj,0.0000028877,0.05000,10.313 | |
| 72,self_attn.k_proj,0.0000000952,0.05000,1.943 | |
| 72,self_attn.v_proj,0.0000002648,0.05000,1.677 | |
| 72,self_attn.q_proj,0.0000007474,0.05000,1.745 | |
| 72,self_attn.o_proj,0.0000003013,0.05000,1.734 | |
| 72,mlp.gate_proj,0.0000059621,0.05000,1.954 | |
| 72,mlp.up_proj,0.0000062113,0.05000,1.930 | |
| 72,mlp.down_proj,0.0000037827,0.05000,10.344 | |
| 73,self_attn.k_proj,0.0000000986,0.05000,1.670 | |
| 73,self_attn.v_proj,0.0000003097,0.05000,1.668 | |
| 73,self_attn.q_proj,0.0000007756,0.05000,1.735 | |
| 73,self_attn.o_proj,0.0000004082,0.05000,1.731 | |
| 73,mlp.gate_proj,0.0000064299,0.05000,1.938 | |
| 73,mlp.up_proj,0.0000067876,0.05000,1.908 | |
| 73,mlp.down_proj,0.0000047355,0.05000,10.334 | |
| 74,self_attn.k_proj,0.0000001003,0.05000,1.683 | |
| 74,self_attn.v_proj,0.0000002953,0.05000,1.667 | |
| 74,self_attn.q_proj,0.0000008356,0.05000,1.731 | |
| 74,self_attn.o_proj,0.0000004746,0.05000,1.718 | |
| 74,mlp.gate_proj,0.0000067756,0.05000,1.921 | |
| 74,mlp.up_proj,0.0000072664,0.05000,1.912 | |
| 74,mlp.down_proj,0.0000065462,0.05000,10.326 | |
| 75,self_attn.k_proj,0.0000000984,0.05000,1.681 | |
| 75,self_attn.v_proj,0.0000003474,0.05000,1.666 | |
| 75,self_attn.q_proj,0.0000008044,0.05000,1.722 | |
| 75,self_attn.o_proj,0.0000006275,0.05000,1.732 | |
| 75,mlp.gate_proj,0.0000073467,0.05000,1.916 | |
| 75,mlp.up_proj,0.0000079761,0.05000,1.917 | |
| 75,mlp.down_proj,0.0000103067,0.05000,10.338 | |
| 76,self_attn.k_proj,0.0000001002,0.05000,1.991 | |
| 76,self_attn.v_proj,0.0000005677,0.05000,1.683 | |
| 76,self_attn.q_proj,0.0000009104,0.05000,1.728 | |
| 76,self_attn.o_proj,0.0000007738,0.05000,1.726 | |
| 76,mlp.gate_proj,0.0000078915,0.05000,1.928 | |
| 76,mlp.up_proj,0.0000086448,0.05000,1.903 | |
| 76,mlp.down_proj,0.0000162721,0.05000,10.330 | |
| 77,self_attn.k_proj,0.0000000943,0.05000,1.729 | |
| 77,self_attn.v_proj,0.0000003583,0.05000,1.727 | |
| 77,self_attn.q_proj,0.0000008443,0.05000,1.744 | |
| 77,self_attn.o_proj,0.0000011174,0.05000,1.731 | |
| 77,mlp.gate_proj,0.0000083925,0.05000,2.330 | |
| 77,mlp.up_proj,0.0000092032,0.05000,1.905 | |
| 77,mlp.down_proj,0.0000187782,0.05000,10.327 | |
| 78,self_attn.k_proj,0.0000000877,0.05000,1.674 | |
| 78,self_attn.v_proj,0.0000003851,0.05000,1.679 | |
| 78,self_attn.q_proj,0.0000007940,0.05000,1.726 | |
| 78,self_attn.o_proj,0.0000012265,0.05000,1.742 | |
| 78,mlp.gate_proj,0.0000077649,0.05000,1.977 | |
| 78,mlp.up_proj,0.0000083943,0.05000,1.974 | |
| 78,mlp.down_proj,0.0000338986,0.05000,10.428 | |
| 79,self_attn.k_proj,0.0000000757,0.05000,1.670 | |
| 79,self_attn.v_proj,0.0000001361,0.05000,1.666 | |
| 79,self_attn.q_proj,0.0000005678,0.05000,1.748 | |
| 79,self_attn.o_proj,0.0000003669,0.05000,1.729 | |
| 79,mlp.gate_proj,0.0000072500,0.05000,1.921 | |
| 79,mlp.up_proj,0.0000076144,0.05000,1.927 | |
| 79,mlp.down_proj,0.0001956243,0.05000,10.314 | |