row,layer_id,short_id,layer_type,param_type,shape,nparam,nnz,sparsity,tile_shape,n_tile,n_tile_total,tile_avg,tile_min,tile_med,tile_max,col_avg,col_min,col_med,col_max,row_avg,row_min,row_med,row_max 0,model.layers.0.self_attn.q_proj,tx.0.attn.q,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.06787109375,0.29833984375,0.66650390625,0.2998046875,0.0,0.03125,1.0,0.2998046875,0.0,0.3125,0.875 1,model.layers.0.self_attn.k_proj,tx.0.attn.k,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.0712890625,0.2978515625,0.66748046875,0.2998046875,0.0,0.03125,1.0,0.2998046875,0.0,0.3125,0.8125 2,model.layers.0.self_attn.v_proj,tx.0.attn.v,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.0791015625,0.29345703125,0.62255859375,0.2998046875,0.0,0.0546875,1.0,0.2998046875,0.0,0.3125,0.8125 3,model.layers.0.self_attn.o_proj,tx.0.attn.o,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.0283203125,0.21826171875,0.9521484375,0.2998046875,0.0,0.2109375,1.0,0.2998046875,0.0,0.25,1.0 4,model.layers.0.mlp.gate_proj,tx.0.mlp.gate,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.2431640625,0.2978515625,0.40576171875,0.2998046875,0.015625,0.3046875,1.0,0.2998046875,0.0,0.3125,0.875 5,model.layers.0.mlp.up_proj,tx.0.mlp.up,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.25244140625,0.2978515625,0.4130859375,0.2998046875,0.0234375,0.296875,1.0,0.2998046875,0.0,0.3125,0.9375 6,model.layers.0.mlp.down_proj,tx.0.mlp.down,Linear,weight,"[4096, 14336]",58720256,41107456,0.2999441623687744,"(128, 16)",32 x 896,28672,0.2999442219734192,0.2001953125,0.30029296875,0.38623046875,0.2999442219734192,0.0,0.3046875,0.671875,0.2999442219734192,0.0,0.3125,0.9375 7,model.layers.1.self_attn.q_proj,tx.1.attn.q,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.17529296875,0.29833984375,0.5009765625,0.2998046875,0.0,0.3046875,1.0,0.2998046875,0.0,0.3125,0.875 8,model.layers.1.self_attn.k_proj,tx.1.attn.k,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.16796875,0.2998046875,0.482421875,0.2998046875,0.0,0.3125,1.0,0.2998046875,0.0,0.3125,0.875 9,model.layers.1.self_attn.v_proj,tx.1.attn.v,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.1787109375,0.2978515625,0.4599609375,0.2998046875,0.0,0.3125,1.0,0.2998046875,0.0,0.3125,0.8125 10,model.layers.1.self_attn.o_proj,tx.1.attn.o,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.11083984375,0.2783203125,0.796875,0.2998046875,0.0078125,0.2578125,0.9921875,0.2998046875,0.0,0.25,1.0 11,model.layers.1.mlp.gate_proj,tx.1.mlp.gate,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.2421875,0.2978515625,0.40185546875,0.2998046875,0.046875,0.296875,1.0,0.2998046875,0.0,0.3125,0.9375 12,model.layers.1.mlp.up_proj,tx.1.mlp.up,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.25048828125,0.2978515625,0.39892578125,0.2998046875,0.046875,0.296875,1.0,0.2998046875,0.0,0.3125,0.9375 13,model.layers.1.mlp.down_proj,tx.1.mlp.down,Linear,weight,"[4096, 14336]",58720256,41107456,0.2999441623687744,"(128, 16)",32 x 896,28672,0.2999442219734192,0.22607421875,0.30078125,0.38818359375,0.2999442219734192,0.0,0.3125,0.5859375,0.2999442219734192,0.0,0.3125,0.9375 14,model.layers.2.self_attn.q_proj,tx.2.attn.q,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.1982421875,0.2998046875,0.4267578125,0.2998046875,0.0,0.3203125,1.0,0.2998046875,0.0,0.3125,0.875 15,model.layers.2.self_attn.k_proj,tx.2.attn.k,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.20703125,0.30029296875,0.43310546875,0.2998046875,0.0,0.3203125,1.0,0.2998046875,0.0,0.3125,0.8125 16,model.layers.2.self_attn.v_proj,tx.2.attn.v,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.2265625,0.29931640625,0.41015625,0.2998046875,0.015625,0.3125,1.0,0.2998046875,0.0,0.3125,0.875 17,model.layers.2.self_attn.o_proj,tx.2.attn.o,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.125,0.2587890625,0.783203125,0.2998046875,0.0,0.2578125,0.953125,0.2998046875,0.0,0.25,1.0 18,model.layers.2.mlp.gate_proj,tx.2.mlp.gate,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.25146484375,0.2978515625,0.40869140625,0.2998046875,0.0390625,0.296875,1.0,0.2998046875,0.0,0.3125,0.875 19,model.layers.2.mlp.up_proj,tx.2.mlp.up,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.244140625,0.2978515625,0.4052734375,0.2998046875,0.0703125,0.296875,1.0,0.2998046875,0.0,0.3125,0.875 20,model.layers.2.mlp.down_proj,tx.2.mlp.down,Linear,weight,"[4096, 14336]",58720256,41107456,0.2999441623687744,"(128, 16)",32 x 896,28672,0.2999442219734192,0.22119140625,0.2998046875,0.39111328125,0.2999442219734192,0.0078125,0.3046875,0.65625,0.2999442219734192,0.0,0.3125,0.9375 21,model.layers.3.self_attn.q_proj,tx.3.attn.q,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.2314453125,0.30029296875,0.3857421875,0.2998046875,0.0,0.3125,1.0,0.2998046875,0.0,0.3125,0.875 22,model.layers.3.self_attn.k_proj,tx.3.attn.k,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.21630859375,0.30029296875,0.380859375,0.2998046875,0.0,0.3125,1.0,0.2998046875,0.0,0.3125,0.8125 23,model.layers.3.self_attn.v_proj,tx.3.attn.v,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.2451171875,0.29931640625,0.3828125,0.2998046875,0.015625,0.3046875,1.0,0.2998046875,0.0,0.3125,0.875 24,model.layers.3.self_attn.o_proj,tx.3.attn.o,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.14453125,0.287109375,0.521484375,0.2998046875,0.0078125,0.2890625,0.7421875,0.2998046875,0.0,0.3125,1.0 25,model.layers.3.mlp.gate_proj,tx.3.mlp.gate,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.24853515625,0.29833984375,0.39892578125,0.2998046875,0.0234375,0.296875,1.0,0.2998046875,0.0,0.3125,0.875 26,model.layers.3.mlp.up_proj,tx.3.mlp.up,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.24609375,0.29833984375,0.40087890625,0.2998046875,0.0703125,0.296875,1.0,0.2998046875,0.0,0.3125,0.875 27,model.layers.3.mlp.down_proj,tx.3.mlp.down,Linear,weight,"[4096, 14336]",58720256,41107456,0.2999441623687744,"(128, 16)",32 x 896,28672,0.2999442219734192,0.22705078125,0.29931640625,0.3720703125,0.2999442219734192,0.0,0.3046875,0.609375,0.2999442219734192,0.0,0.3125,0.875 28,model.layers.4.self_attn.q_proj,tx.4.attn.q,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.2177734375,0.30029296875,0.373046875,0.2998046875,0.0,0.3125,1.0,0.2998046875,0.0,0.3125,0.875 29,model.layers.4.self_attn.k_proj,tx.4.attn.k,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.2197265625,0.30029296875,0.3916015625,0.2998046875,0.0,0.3125,1.0,0.2998046875,0.0,0.3125,0.875 30,model.layers.4.self_attn.v_proj,tx.4.attn.v,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.23974609375,0.2998046875,0.384765625,0.2998046875,0.0078125,0.3046875,1.0,0.2998046875,0.0,0.3125,0.8125 31,model.layers.4.self_attn.o_proj,tx.4.attn.o,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.14208984375,0.2685546875,0.74365234375,0.2998046875,0.0,0.265625,0.8984375,0.2998046875,0.0,0.25,1.0 32,model.layers.4.mlp.gate_proj,tx.4.mlp.gate,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.24560546875,0.2998046875,0.37841796875,0.2998046875,0.0078125,0.3046875,1.0,0.2998046875,0.0,0.3125,0.875 33,model.layers.4.mlp.up_proj,tx.4.mlp.up,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.25244140625,0.2998046875,0.37353515625,0.2998046875,0.0625,0.3046875,1.0,0.2998046875,0.0,0.3125,0.875 34,model.layers.4.mlp.down_proj,tx.4.mlp.down,Linear,weight,"[4096, 14336]",58720256,41107456,0.2999441623687744,"(128, 16)",32 x 896,28672,0.2999442219734192,0.23291015625,0.30029296875,0.37158203125,0.2999442219734192,0.0078125,0.296875,0.8359375,0.2999442219734192,0.0,0.3125,0.9375 35,model.layers.5.self_attn.q_proj,tx.5.attn.q,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.21484375,0.30029296875,0.37890625,0.2998046875,0.0,0.3125,0.6796875,0.2998046875,0.0,0.3125,0.875 36,model.layers.5.self_attn.k_proj,tx.5.attn.k,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.2158203125,0.30029296875,0.3759765625,0.2998046875,0.0,0.3125,0.75,0.2998046875,0.0,0.3125,0.875 37,model.layers.5.self_attn.v_proj,tx.5.attn.v,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.24560546875,0.2998046875,0.3876953125,0.2998046875,0.015625,0.3046875,1.0,0.2998046875,0.0,0.3125,0.875 38,model.layers.5.self_attn.o_proj,tx.5.attn.o,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.10009765625,0.2470703125,0.70556640625,0.2998046875,0.0,0.265625,0.859375,0.2998046875,0.0,0.25,1.0 39,model.layers.5.mlp.gate_proj,tx.5.mlp.gate,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.23828125,0.2998046875,0.36669921875,0.2998046875,0.0,0.3046875,1.0,0.2998046875,0.0,0.3125,0.875 40,model.layers.5.mlp.up_proj,tx.5.mlp.up,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.244140625,0.2998046875,0.38037109375,0.2998046875,0.0546875,0.296875,1.0,0.2998046875,0.0,0.3125,0.9375 41,model.layers.5.mlp.down_proj,tx.5.mlp.down,Linear,weight,"[4096, 14336]",58720256,41107456,0.2999441623687744,"(128, 16)",32 x 896,28672,0.2999442219734192,0.24267578125,0.2998046875,0.37939453125,0.2999442219734192,0.0,0.296875,0.6953125,0.2999442219734192,0.0,0.3125,0.875 42,model.layers.6.self_attn.q_proj,tx.6.attn.q,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.22998046875,0.2998046875,0.37109375,0.2998046875,0.0,0.3125,0.6484375,0.2998046875,0.0,0.3125,0.875 43,model.layers.6.self_attn.k_proj,tx.6.attn.k,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.2216796875,0.2998046875,0.3720703125,0.2998046875,0.0,0.3125,0.71875,0.2998046875,0.0,0.3125,0.875 44,model.layers.6.self_attn.v_proj,tx.6.attn.v,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.236328125,0.29931640625,0.37255859375,0.2998046875,0.0078125,0.3046875,1.0,0.2998046875,0.0,0.3125,0.875 45,model.layers.6.self_attn.o_proj,tx.6.attn.o,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.13427734375,0.28369140625,0.56689453125,0.2998046875,0.0078125,0.28125,0.7890625,0.2998046875,0.0,0.3125,1.0 46,model.layers.6.mlp.gate_proj,tx.6.mlp.gate,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.24462890625,0.2998046875,0.3681640625,0.2998046875,0.0078125,0.3046875,1.0,0.2998046875,0.0,0.3125,0.875 47,model.layers.6.mlp.up_proj,tx.6.mlp.up,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.248046875,0.2998046875,0.373046875,0.2998046875,0.046875,0.296875,1.0,0.2998046875,0.0,0.3125,0.9375 48,model.layers.6.mlp.down_proj,tx.6.mlp.down,Linear,weight,"[4096, 14336]",58720256,41107456,0.2999441623687744,"(128, 16)",32 x 896,28672,0.2999442219734192,0.23876953125,0.2998046875,0.37548828125,0.2999442219734192,0.0,0.296875,0.734375,0.2999442219734192,0.0,0.3125,0.875 49,model.layers.7.self_attn.q_proj,tx.7.attn.q,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.22900390625,0.2998046875,0.3681640625,0.2998046875,0.0,0.3046875,0.65625,0.2998046875,0.0,0.3125,0.875 50,model.layers.7.self_attn.k_proj,tx.7.attn.k,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.23876953125,0.30078125,0.3642578125,0.2998046875,0.0,0.3125,0.734375,0.2998046875,0.0,0.3125,0.875 51,model.layers.7.self_attn.v_proj,tx.7.attn.v,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.2412109375,0.29931640625,0.369140625,0.2998046875,0.0078125,0.3046875,0.9921875,0.2998046875,0.0,0.3125,0.875 52,model.layers.7.self_attn.o_proj,tx.7.attn.o,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.19091796875,0.294921875,0.45068359375,0.2998046875,0.0,0.3046875,0.7265625,0.2998046875,0.0,0.3125,0.875 53,model.layers.7.mlp.gate_proj,tx.7.mlp.gate,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.244140625,0.30029296875,0.34375,0.2998046875,0.0078125,0.3046875,0.515625,0.2998046875,0.0,0.3125,0.875 54,model.layers.7.mlp.up_proj,tx.7.mlp.up,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.23681640625,0.2998046875,0.3505859375,0.2998046875,0.03125,0.3046875,0.5,0.2998046875,0.0,0.3125,0.9375 55,model.layers.7.mlp.down_proj,tx.7.mlp.down,Linear,weight,"[4096, 14336]",58720256,41107456,0.2999441623687744,"(128, 16)",32 x 896,28672,0.2999442219734192,0.23388671875,0.2998046875,0.37109375,0.2999442219734192,0.0,0.296875,0.7265625,0.2999442219734192,0.0,0.3125,0.9375 56,model.layers.8.self_attn.q_proj,tx.8.attn.q,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.23095703125,0.2998046875,0.3603515625,0.2998046875,0.0,0.3046875,0.6171875,0.2998046875,0.0,0.3125,0.875 57,model.layers.8.self_attn.k_proj,tx.8.attn.k,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.22900390625,0.2998046875,0.357421875,0.2998046875,0.0,0.3046875,0.6484375,0.2998046875,0.0,0.3125,0.875 58,model.layers.8.self_attn.v_proj,tx.8.attn.v,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.24462890625,0.2998046875,0.37109375,0.2998046875,0.015625,0.3046875,0.9921875,0.2998046875,0.0,0.3125,0.8125 59,model.layers.8.self_attn.o_proj,tx.8.attn.o,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.15673828125,0.29248046875,0.51708984375,0.2998046875,0.0,0.2890625,0.6953125,0.2998046875,0.0,0.3125,0.9375 60,model.layers.8.mlp.gate_proj,tx.8.mlp.gate,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.24267578125,0.30029296875,0.37060546875,0.2998046875,0.0,0.3046875,1.0,0.2998046875,0.0,0.3125,0.9375 61,model.layers.8.mlp.up_proj,tx.8.mlp.up,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.24560546875,0.2998046875,0.3681640625,0.2998046875,0.0234375,0.296875,1.0,0.2998046875,0.0,0.3125,0.875 62,model.layers.8.mlp.down_proj,tx.8.mlp.down,Linear,weight,"[4096, 14336]",58720256,41107456,0.2999441623687744,"(128, 16)",32 x 896,28672,0.2999442219734192,0.2353515625,0.2998046875,0.37060546875,0.2999442219734192,0.03125,0.296875,0.703125,0.2999442219734192,0.0,0.3125,0.9375 63,model.layers.9.self_attn.q_proj,tx.9.attn.q,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.2314453125,0.30029296875,0.35693359375,0.2998046875,0.0,0.3046875,0.625,0.2998046875,0.0,0.3125,0.875 64,model.layers.9.self_attn.k_proj,tx.9.attn.k,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.23291015625,0.2998046875,0.35595703125,0.2998046875,0.0,0.3046875,0.71875,0.2998046875,0.0,0.3125,0.8125 65,model.layers.9.self_attn.v_proj,tx.9.attn.v,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.24609375,0.29931640625,0.36669921875,0.2998046875,0.0078125,0.296875,0.9921875,0.2998046875,0.0,0.3125,0.875 66,model.layers.9.self_attn.o_proj,tx.9.attn.o,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.15771484375,0.29052734375,0.54150390625,0.2998046875,0.0078125,0.296875,0.7265625,0.2998046875,0.0,0.3125,0.9375 67,model.layers.9.mlp.gate_proj,tx.9.mlp.gate,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.23828125,0.30029296875,0.34619140625,0.2998046875,0.0,0.3046875,0.5078125,0.2998046875,0.0,0.3125,0.9375 68,model.layers.9.mlp.up_proj,tx.9.mlp.up,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.24853515625,0.30029296875,0.34228515625,0.2998046875,0.015625,0.3046875,0.5234375,0.2998046875,0.0,0.3125,0.875 69,model.layers.9.mlp.down_proj,tx.9.mlp.down,Linear,weight,"[4096, 14336]",58720256,41107456,0.2999441623687744,"(128, 16)",32 x 896,28672,0.2999442219734192,0.2275390625,0.2998046875,0.36181640625,0.2999442219734192,0.0,0.296875,0.671875,0.2999442219734192,0.0,0.3125,0.875 70,model.layers.10.self_attn.q_proj,tx.10.attn.q,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.2314453125,0.30029296875,0.36181640625,0.2998046875,0.0,0.3046875,0.5859375,0.2998046875,0.0,0.3125,0.875 71,model.layers.10.self_attn.k_proj,tx.10.attn.k,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.22998046875,0.30029296875,0.3583984375,0.2998046875,0.0,0.3046875,0.7109375,0.2998046875,0.0,0.3125,0.875 72,model.layers.10.self_attn.v_proj,tx.10.attn.v,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.236328125,0.2998046875,0.357421875,0.2998046875,0.0078125,0.296875,0.9921875,0.2998046875,0.0,0.3125,0.8125 73,model.layers.10.self_attn.o_proj,tx.10.attn.o,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.1318359375,0.27099609375,0.5927734375,0.2998046875,0.0,0.28125,0.765625,0.2998046875,0.0,0.3125,1.0 74,model.layers.10.mlp.gate_proj,tx.10.mlp.gate,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.2451171875,0.30029296875,0.3466796875,0.2998046875,0.0078125,0.3046875,0.515625,0.2998046875,0.0,0.3125,0.9375 75,model.layers.10.mlp.up_proj,tx.10.mlp.up,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.2529296875,0.30029296875,0.35107421875,0.2998046875,0.0234375,0.296875,0.5390625,0.2998046875,0.0,0.3125,0.875 76,model.layers.10.mlp.down_proj,tx.10.mlp.down,Linear,weight,"[4096, 14336]",58720256,41107456,0.2999441623687744,"(128, 16)",32 x 896,28672,0.2999442219734192,0.23291015625,0.30029296875,0.3662109375,0.2999442219734192,0.0,0.296875,0.640625,0.2999442219734192,0.0,0.3125,1.0 77,model.layers.11.self_attn.q_proj,tx.11.attn.q,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.2265625,0.30029296875,0.35595703125,0.2998046875,0.0,0.3046875,0.6640625,0.2998046875,0.0,0.3125,0.875 78,model.layers.11.self_attn.k_proj,tx.11.attn.k,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.2373046875,0.30029296875,0.36181640625,0.2998046875,0.0,0.3046875,0.765625,0.2998046875,0.0,0.3125,0.8125 79,model.layers.11.self_attn.v_proj,tx.11.attn.v,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.24072265625,0.2998046875,0.35693359375,0.2998046875,0.0234375,0.296875,0.9921875,0.2998046875,0.0,0.3125,0.875 80,model.layers.11.self_attn.o_proj,tx.11.attn.o,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.166015625,0.28173828125,0.59228515625,0.2998046875,0.0078125,0.2890625,0.7578125,0.2998046875,0.0,0.3125,1.0 81,model.layers.11.mlp.gate_proj,tx.11.mlp.gate,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.23974609375,0.30029296875,0.34375,0.2998046875,0.0078125,0.3046875,0.515625,0.2998046875,0.0,0.3125,0.875 82,model.layers.11.mlp.up_proj,tx.11.mlp.up,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.24072265625,0.30029296875,0.3505859375,0.2998046875,0.03125,0.3046875,0.5546875,0.2998046875,0.0,0.3125,0.875 83,model.layers.11.mlp.down_proj,tx.11.mlp.down,Linear,weight,"[4096, 14336]",58720256,41107456,0.2999441623687744,"(128, 16)",32 x 896,28672,0.2999442219734192,0.228515625,0.2998046875,0.36669921875,0.2999442219734192,0.0,0.3046875,0.78125,0.2999442219734192,0.0,0.3125,0.875 84,model.layers.12.self_attn.q_proj,tx.12.attn.q,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.228515625,0.30029296875,0.35693359375,0.2998046875,0.0,0.3046875,0.6171875,0.2998046875,0.0,0.3125,0.875 85,model.layers.12.self_attn.k_proj,tx.12.attn.k,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.22509765625,0.30029296875,0.35302734375,0.2998046875,0.0,0.3046875,0.734375,0.2998046875,0.0,0.3125,0.875 86,model.layers.12.self_attn.v_proj,tx.12.attn.v,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.24267578125,0.29931640625,0.36572265625,0.2998046875,0.0234375,0.296875,0.9921875,0.2998046875,0.0,0.3125,0.8125 87,model.layers.12.self_attn.o_proj,tx.12.attn.o,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.12744140625,0.30078125,0.47216796875,0.2998046875,0.0078125,0.3046875,0.625,0.2998046875,0.0,0.3125,0.9375 88,model.layers.12.mlp.gate_proj,tx.12.mlp.gate,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.2421875,0.30029296875,0.3447265625,0.2998046875,0.0,0.3046875,0.5078125,0.2998046875,0.0,0.3125,0.875 89,model.layers.12.mlp.up_proj,tx.12.mlp.up,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.2470703125,0.30029296875,0.3447265625,0.2998046875,0.0234375,0.3046875,0.515625,0.2998046875,0.0,0.3125,0.9375 90,model.layers.12.mlp.down_proj,tx.12.mlp.down,Linear,weight,"[4096, 14336]",58720256,41107456,0.2999441623687744,"(128, 16)",32 x 896,28672,0.2999442219734192,0.2275390625,0.2998046875,0.3681640625,0.2999442219734192,0.0,0.3046875,0.6640625,0.2999442219734192,0.0,0.3125,0.875 91,model.layers.13.self_attn.q_proj,tx.13.attn.q,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.2392578125,0.2998046875,0.35888671875,0.2998046875,0.0,0.3046875,0.6640625,0.2998046875,0.0,0.3125,0.875 92,model.layers.13.self_attn.k_proj,tx.13.attn.k,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.2275390625,0.29931640625,0.3544921875,0.2998046875,0.0,0.3046875,0.7890625,0.2998046875,0.0,0.3125,0.8125 93,model.layers.13.self_attn.v_proj,tx.13.attn.v,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.248046875,0.29931640625,0.36572265625,0.2998046875,0.015625,0.296875,0.9921875,0.2998046875,0.0,0.3125,0.9375 94,model.layers.13.self_attn.o_proj,tx.13.attn.o,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.150390625,0.29296875,0.525390625,0.2998046875,0.0,0.296875,0.6953125,0.2998046875,0.0,0.3125,0.9375 95,model.layers.13.mlp.gate_proj,tx.13.mlp.gate,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.24365234375,0.30029296875,0.349609375,0.2998046875,0.0,0.3046875,0.515625,0.2998046875,0.0,0.3125,0.9375 96,model.layers.13.mlp.up_proj,tx.13.mlp.up,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.25,0.30029296875,0.34326171875,0.2998046875,0.015625,0.3046875,0.5078125,0.2998046875,0.0,0.3125,0.9375 97,model.layers.13.mlp.down_proj,tx.13.mlp.down,Linear,weight,"[4096, 14336]",58720256,41107456,0.2999441623687744,"(128, 16)",32 x 896,28672,0.2999442219734192,0.22802734375,0.2998046875,0.3798828125,0.2999442219734192,0.0,0.3046875,0.734375,0.2999442219734192,0.0,0.3125,0.9375 98,model.layers.14.self_attn.q_proj,tx.14.attn.q,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.23193359375,0.30029296875,0.361328125,0.2998046875,0.0,0.3046875,0.59375,0.2998046875,0.0,0.3125,0.875 99,model.layers.14.self_attn.k_proj,tx.14.attn.k,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.234375,0.2998046875,0.3525390625,0.2998046875,0.0,0.3046875,0.8359375,0.2998046875,0.0,0.3125,0.8125 100,model.layers.14.self_attn.v_proj,tx.14.attn.v,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.23779296875,0.2998046875,0.3720703125,0.2998046875,0.0078125,0.3046875,0.9921875,0.2998046875,0.0,0.3125,0.875 101,model.layers.14.self_attn.o_proj,tx.14.attn.o,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.16064453125,0.28955078125,0.5732421875,0.2998046875,0.0,0.2890625,0.75,0.2998046875,0.0,0.3125,1.0 102,model.layers.14.mlp.gate_proj,tx.14.mlp.gate,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.24169921875,0.30029296875,0.34619140625,0.2998046875,0.0,0.3046875,0.5078125,0.2998046875,0.0,0.3125,1.0 103,model.layers.14.mlp.up_proj,tx.14.mlp.up,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.240234375,0.2998046875,0.34228515625,0.2998046875,0.0,0.3046875,0.5078125,0.2998046875,0.0,0.3125,0.9375 104,model.layers.14.mlp.down_proj,tx.14.mlp.down,Linear,weight,"[4096, 14336]",58720256,41107456,0.2999441623687744,"(128, 16)",32 x 896,28672,0.2999442219734192,0.22119140625,0.30029296875,0.37060546875,0.2999442219734192,0.015625,0.296875,0.671875,0.2999442219734192,0.0,0.3125,0.9375 105,model.layers.15.self_attn.q_proj,tx.15.attn.q,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.23828125,0.30029296875,0.357421875,0.2998046875,0.0,0.3046875,0.59375,0.2998046875,0.0,0.3125,0.875 106,model.layers.15.self_attn.k_proj,tx.15.attn.k,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.236328125,0.30029296875,0.3525390625,0.2998046875,0.0,0.3046875,0.7578125,0.2998046875,0.0,0.3125,0.875 107,model.layers.15.self_attn.v_proj,tx.15.attn.v,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.232421875,0.2998046875,0.37451171875,0.2998046875,0.015625,0.3046875,1.0,0.2998046875,0.0,0.3125,0.8125 108,model.layers.15.self_attn.o_proj,tx.15.attn.o,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.1240234375,0.2705078125,0.6328125,0.2998046875,0.0078125,0.2734375,0.7734375,0.2998046875,0.0,0.25,1.0 109,model.layers.15.mlp.gate_proj,tx.15.mlp.gate,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.240234375,0.30029296875,0.35400390625,0.2998046875,0.0,0.3046875,0.5234375,0.2998046875,0.0,0.3125,0.9375 110,model.layers.15.mlp.up_proj,tx.15.mlp.up,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.248046875,0.2998046875,0.3447265625,0.2998046875,0.015625,0.3046875,0.515625,0.2998046875,0.0,0.3125,0.875 111,model.layers.15.mlp.down_proj,tx.15.mlp.down,Linear,weight,"[4096, 14336]",58720256,41107456,0.2999441623687744,"(128, 16)",32 x 896,28672,0.2999442219734192,0.22900390625,0.2998046875,0.375,0.2999442219734192,0.015625,0.296875,0.7265625,0.2999442219734192,0.0,0.3125,0.875 112,model.layers.16.self_attn.q_proj,tx.16.attn.q,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.23779296875,0.30029296875,0.357421875,0.2998046875,0.0,0.3046875,0.640625,0.2998046875,0.0,0.3125,0.8125 113,model.layers.16.self_attn.k_proj,tx.16.attn.k,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.232421875,0.30029296875,0.35009765625,0.2998046875,0.0,0.3046875,0.7578125,0.2998046875,0.0,0.3125,0.875 114,model.layers.16.self_attn.v_proj,tx.16.attn.v,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.23046875,0.29931640625,0.36572265625,0.2998046875,0.0078125,0.3046875,1.0,0.2998046875,0.0,0.3125,0.8125 115,model.layers.16.self_attn.o_proj,tx.16.attn.o,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.11962890625,0.2841796875,0.5732421875,0.2998046875,0.0078125,0.2890625,0.7421875,0.2998046875,0.0,0.3125,1.0 116,model.layers.16.mlp.gate_proj,tx.16.mlp.gate,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.24609375,0.30029296875,0.34814453125,0.2998046875,0.0,0.3046875,0.53125,0.2998046875,0.0,0.3125,0.9375 117,model.layers.16.mlp.up_proj,tx.16.mlp.up,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.25,0.2998046875,0.349609375,0.2998046875,0.0078125,0.3046875,0.5390625,0.2998046875,0.0,0.3125,0.875 118,model.layers.16.mlp.down_proj,tx.16.mlp.down,Linear,weight,"[4096, 14336]",58720256,41107456,0.2999441623687744,"(128, 16)",32 x 896,28672,0.2999442219734192,0.23486328125,0.2998046875,0.37255859375,0.2999442219734192,0.0078125,0.296875,0.640625,0.2999442219734192,0.0,0.3125,0.9375 119,model.layers.17.self_attn.q_proj,tx.17.attn.q,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.23193359375,0.2998046875,0.3564453125,0.2998046875,0.0,0.3046875,0.59375,0.2998046875,0.0,0.3125,0.875 120,model.layers.17.self_attn.k_proj,tx.17.attn.k,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.2431640625,0.30029296875,0.35595703125,0.2998046875,0.0,0.3125,0.734375,0.2998046875,0.0,0.3125,0.8125 121,model.layers.17.self_attn.v_proj,tx.17.attn.v,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.24658203125,0.2998046875,0.369140625,0.2998046875,0.015625,0.3046875,1.0,0.2998046875,0.0,0.3125,0.875 122,model.layers.17.self_attn.o_proj,tx.17.attn.o,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.13037109375,0.279296875,0.64697265625,0.2998046875,0.0078125,0.28125,0.8203125,0.2998046875,0.0,0.25,1.0 123,model.layers.17.mlp.gate_proj,tx.17.mlp.gate,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.24365234375,0.2998046875,0.34326171875,0.2998046875,0.0,0.3046875,0.5859375,0.2998046875,0.0,0.3125,0.9375 124,model.layers.17.mlp.up_proj,tx.17.mlp.up,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.2412109375,0.2998046875,0.34521484375,0.2998046875,0.0,0.3046875,0.5859375,0.2998046875,0.0,0.3125,0.875 125,model.layers.17.mlp.down_proj,tx.17.mlp.down,Linear,weight,"[4096, 14336]",58720256,41107456,0.2999441623687744,"(128, 16)",32 x 896,28672,0.2999442219734192,0.22705078125,0.2998046875,0.3828125,0.2999442219734192,0.0234375,0.3046875,0.8046875,0.2999442219734192,0.0,0.3125,0.875 126,model.layers.18.self_attn.q_proj,tx.18.attn.q,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.2353515625,0.30029296875,0.357421875,0.2998046875,0.0,0.3046875,0.71875,0.2998046875,0.0,0.3125,0.875 127,model.layers.18.self_attn.k_proj,tx.18.attn.k,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.23779296875,0.30078125,0.3583984375,0.2998046875,0.0,0.3125,0.7890625,0.2998046875,0.0,0.3125,0.8125 128,model.layers.18.self_attn.v_proj,tx.18.attn.v,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.23095703125,0.2998046875,0.37255859375,0.2998046875,0.0078125,0.3046875,1.0,0.2998046875,0.0,0.3125,0.8125 129,model.layers.18.self_attn.o_proj,tx.18.attn.o,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.1220703125,0.23291015625,0.77880859375,0.2998046875,0.0,0.25,0.96875,0.2998046875,0.0,0.25,1.0 130,model.layers.18.mlp.gate_proj,tx.18.mlp.gate,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.24365234375,0.2998046875,0.3505859375,0.2998046875,0.0,0.3046875,0.5625,0.2998046875,0.0,0.3125,0.875 131,model.layers.18.mlp.up_proj,tx.18.mlp.up,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.2509765625,0.2998046875,0.34228515625,0.2998046875,0.015625,0.3046875,0.625,0.2998046875,0.0,0.3125,0.9375 132,model.layers.18.mlp.down_proj,tx.18.mlp.down,Linear,weight,"[4096, 14336]",58720256,41107456,0.2999441623687744,"(128, 16)",32 x 896,28672,0.2999442219734192,0.22998046875,0.2998046875,0.365234375,0.2999442219734192,0.0,0.3046875,0.6484375,0.2999442219734192,0.0,0.3125,0.875 133,model.layers.19.self_attn.q_proj,tx.19.attn.q,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.23779296875,0.30029296875,0.357421875,0.2998046875,0.0,0.3046875,0.6328125,0.2998046875,0.0,0.3125,0.875 134,model.layers.19.self_attn.k_proj,tx.19.attn.k,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.22900390625,0.30029296875,0.361328125,0.2998046875,0.0,0.3125,0.796875,0.2998046875,0.0,0.3125,0.875 135,model.layers.19.self_attn.v_proj,tx.19.attn.v,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.23828125,0.29931640625,0.37646484375,0.2998046875,0.0078125,0.3046875,1.0,0.2998046875,0.0,0.3125,0.875 136,model.layers.19.self_attn.o_proj,tx.19.attn.o,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.0908203125,0.2783203125,0.72607421875,0.2998046875,0.0,0.28125,0.90625,0.2998046875,0.0,0.25,1.0 137,model.layers.19.mlp.gate_proj,tx.19.mlp.gate,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.2412109375,0.2998046875,0.34375,0.2998046875,0.0,0.3046875,0.5703125,0.2998046875,0.0,0.3125,0.9375 138,model.layers.19.mlp.up_proj,tx.19.mlp.up,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.2509765625,0.2998046875,0.34375,0.2998046875,0.0078125,0.3046875,0.625,0.2998046875,0.0,0.3125,0.9375 139,model.layers.19.mlp.down_proj,tx.19.mlp.down,Linear,weight,"[4096, 14336]",58720256,41107456,0.2999441623687744,"(128, 16)",32 x 896,28672,0.2999442219734192,0.22705078125,0.2998046875,0.37109375,0.2999442219734192,0.0078125,0.3046875,0.625,0.2999442219734192,0.0,0.3125,0.875 140,model.layers.20.self_attn.q_proj,tx.20.attn.q,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.234375,0.30029296875,0.35107421875,0.2998046875,0.0,0.3046875,0.578125,0.2998046875,0.0,0.3125,0.8125 141,model.layers.20.self_attn.k_proj,tx.20.attn.k,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.23193359375,0.30078125,0.35546875,0.2998046875,0.0,0.3125,0.7734375,0.2998046875,0.0,0.3125,0.875 142,model.layers.20.self_attn.v_proj,tx.20.attn.v,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.23974609375,0.30029296875,0.3779296875,0.2998046875,0.0078125,0.3046875,1.0,0.2998046875,0.0,0.3125,0.8125 143,model.layers.20.self_attn.o_proj,tx.20.attn.o,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.12451171875,0.2587890625,0.7373046875,0.2998046875,0.0,0.265625,0.921875,0.2998046875,0.0,0.25,1.0 144,model.layers.20.mlp.gate_proj,tx.20.mlp.gate,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.24755859375,0.2998046875,0.34423828125,0.2998046875,0.0,0.3046875,0.59375,0.2998046875,0.0,0.3125,0.875 145,model.layers.20.mlp.up_proj,tx.20.mlp.up,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.25341796875,0.2998046875,0.34375,0.2998046875,0.015625,0.3046875,0.6328125,0.2998046875,0.0,0.3125,0.875 146,model.layers.20.mlp.down_proj,tx.20.mlp.down,Linear,weight,"[4096, 14336]",58720256,41107456,0.2999441623687744,"(128, 16)",32 x 896,28672,0.2999442219734192,0.23583984375,0.30029296875,0.3671875,0.2999442219734192,0.0,0.3046875,0.625,0.2999442219734192,0.0,0.3125,0.875 147,model.layers.21.self_attn.q_proj,tx.21.attn.q,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.2294921875,0.30029296875,0.35400390625,0.2998046875,0.0,0.3046875,0.53125,0.2998046875,0.0,0.3125,1.0 148,model.layers.21.self_attn.k_proj,tx.21.attn.k,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.22998046875,0.30029296875,0.36474609375,0.2998046875,0.0,0.3125,0.71875,0.2998046875,0.0,0.3125,0.8125 149,model.layers.21.self_attn.v_proj,tx.21.attn.v,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.24169921875,0.2998046875,0.376953125,0.2998046875,0.0078125,0.3046875,1.0,0.2998046875,0.0,0.3125,0.875 150,model.layers.21.self_attn.o_proj,tx.21.attn.o,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.10009765625,0.2607421875,0.7841796875,0.2998046875,0.0,0.2734375,0.9765625,0.2998046875,0.0,0.25,1.0 151,model.layers.21.mlp.gate_proj,tx.21.mlp.gate,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.24853515625,0.2998046875,0.34228515625,0.2998046875,0.0,0.3046875,0.6015625,0.2998046875,0.0,0.3125,0.875 152,model.layers.21.mlp.up_proj,tx.21.mlp.up,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.24560546875,0.2998046875,0.345703125,0.2998046875,0.015625,0.3046875,0.6328125,0.2998046875,0.0,0.3125,0.875 153,model.layers.21.mlp.down_proj,tx.21.mlp.down,Linear,weight,"[4096, 14336]",58720256,41107456,0.2999441623687744,"(128, 16)",32 x 896,28672,0.2999442219734192,0.2265625,0.2998046875,0.3671875,0.2999442219734192,0.015625,0.3046875,0.6171875,0.2999442219734192,0.0,0.3125,0.875 154,model.layers.22.self_attn.q_proj,tx.22.attn.q,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.23486328125,0.30029296875,0.3564453125,0.2998046875,0.0,0.3046875,0.546875,0.2998046875,0.0,0.3125,0.875 155,model.layers.22.self_attn.k_proj,tx.22.attn.k,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.232421875,0.2998046875,0.359375,0.2998046875,0.0,0.3125,0.765625,0.2998046875,0.0,0.3125,0.8125 156,model.layers.22.self_attn.v_proj,tx.22.attn.v,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.2353515625,0.2998046875,0.36669921875,0.2998046875,0.015625,0.3046875,1.0,0.2998046875,0.0,0.3125,0.8125 157,model.layers.22.self_attn.o_proj,tx.22.attn.o,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.1240234375,0.2919921875,0.59521484375,0.2998046875,0.0078125,0.2890625,0.78125,0.2998046875,0.0,0.3125,1.0 158,model.layers.22.mlp.gate_proj,tx.22.mlp.gate,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.25,0.30029296875,0.34619140625,0.2998046875,0.0,0.3046875,0.5859375,0.2998046875,0.0,0.3125,0.875 159,model.layers.22.mlp.up_proj,tx.22.mlp.up,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.25341796875,0.2998046875,0.34619140625,0.2998046875,0.0,0.296875,0.640625,0.2998046875,0.0,0.3125,0.875 160,model.layers.22.mlp.down_proj,tx.22.mlp.down,Linear,weight,"[4096, 14336]",58720256,41107456,0.2999441623687744,"(128, 16)",32 x 896,28672,0.2999442219734192,0.22021484375,0.2998046875,0.369140625,0.2999442219734192,0.0,0.3046875,0.5703125,0.2999442219734192,0.0,0.3125,0.875 161,model.layers.23.self_attn.q_proj,tx.23.attn.q,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.22705078125,0.30029296875,0.3583984375,0.2998046875,0.0,0.3046875,0.546875,0.2998046875,0.0,0.3125,0.875 162,model.layers.23.self_attn.k_proj,tx.23.attn.k,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.23876953125,0.30078125,0.3583984375,0.2998046875,0.0,0.3125,0.765625,0.2998046875,0.0,0.3125,0.8125 163,model.layers.23.self_attn.v_proj,tx.23.attn.v,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.2392578125,0.2998046875,0.37109375,0.2998046875,0.015625,0.3046875,1.0,0.2998046875,0.0,0.3125,0.875 164,model.layers.23.self_attn.o_proj,tx.23.attn.o,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.103515625,0.29150390625,0.55322265625,0.2998046875,0.0,0.2890625,0.7265625,0.2998046875,0.0,0.3125,0.9375 165,model.layers.23.mlp.gate_proj,tx.23.mlp.gate,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.24951171875,0.2998046875,0.34619140625,0.2998046875,0.0,0.3046875,0.640625,0.2998046875,0.0,0.3125,0.875 166,model.layers.23.mlp.up_proj,tx.23.mlp.up,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.2490234375,0.2998046875,0.34912109375,0.2998046875,0.015625,0.296875,0.6484375,0.2998046875,0.0,0.3125,0.875 167,model.layers.23.mlp.down_proj,tx.23.mlp.down,Linear,weight,"[4096, 14336]",58720256,41107456,0.2999441623687744,"(128, 16)",32 x 896,28672,0.2999442219734192,0.21533203125,0.30029296875,0.3642578125,0.2999442219734192,0.0,0.3125,0.5859375,0.2999442219734192,0.0,0.3125,0.875 168,model.layers.24.self_attn.q_proj,tx.24.attn.q,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.23486328125,0.30029296875,0.35498046875,0.2998046875,0.0,0.3125,0.59375,0.2998046875,0.0,0.3125,0.875 169,model.layers.24.self_attn.k_proj,tx.24.attn.k,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.234375,0.30029296875,0.3544921875,0.2998046875,0.0,0.3125,0.765625,0.2998046875,0.0,0.3125,0.875 170,model.layers.24.self_attn.v_proj,tx.24.attn.v,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.23388671875,0.2998046875,0.373046875,0.2998046875,0.0078125,0.3046875,1.0,0.2998046875,0.0,0.3125,0.875 171,model.layers.24.self_attn.o_proj,tx.24.attn.o,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.10693359375,0.26318359375,0.61572265625,0.2998046875,0.0,0.2734375,0.8125,0.2998046875,0.0,0.3125,1.0 172,model.layers.24.mlp.gate_proj,tx.24.mlp.gate,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.25,0.30029296875,0.34814453125,0.2998046875,0.0,0.3046875,0.625,0.2998046875,0.0,0.3125,0.875 173,model.layers.24.mlp.up_proj,tx.24.mlp.up,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.2431640625,0.30029296875,0.34423828125,0.2998046875,0.015625,0.296875,0.6484375,0.2998046875,0.0,0.3125,0.9375 174,model.layers.24.mlp.down_proj,tx.24.mlp.down,Linear,weight,"[4096, 14336]",58720256,41107456,0.2999441623687744,"(128, 16)",32 x 896,28672,0.2999442219734192,0.22509765625,0.30078125,0.369140625,0.2999442219734192,0.0,0.3125,0.578125,0.2999442219734192,0.0,0.3125,0.875 175,model.layers.25.self_attn.q_proj,tx.25.attn.q,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.23291015625,0.2998046875,0.35693359375,0.2998046875,0.0,0.3125,0.546875,0.2998046875,0.0,0.3125,0.9375 176,model.layers.25.self_attn.k_proj,tx.25.attn.k,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.2216796875,0.30029296875,0.36767578125,0.2998046875,0.0,0.3125,0.7421875,0.2998046875,0.0,0.3125,0.8125 177,model.layers.25.self_attn.v_proj,tx.25.attn.v,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.236328125,0.2998046875,0.3681640625,0.2998046875,0.0,0.3046875,1.0,0.2998046875,0.0,0.3125,0.8125 178,model.layers.25.self_attn.o_proj,tx.25.attn.o,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.10107421875,0.248046875,0.81982421875,0.2998046875,0.0078125,0.2578125,0.9609375,0.2998046875,0.0,0.25,1.0 179,model.layers.25.mlp.gate_proj,tx.25.mlp.gate,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.24951171875,0.2998046875,0.34521484375,0.2998046875,0.0,0.3046875,0.609375,0.2998046875,0.0,0.3125,0.875 180,model.layers.25.mlp.up_proj,tx.25.mlp.up,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.248046875,0.2998046875,0.34375,0.2998046875,0.0,0.296875,0.6328125,0.2998046875,0.0,0.3125,0.9375 181,model.layers.25.mlp.down_proj,tx.25.mlp.down,Linear,weight,"[4096, 14336]",58720256,41107456,0.2999441623687744,"(128, 16)",32 x 896,28672,0.2999442219734192,0.2119140625,0.30029296875,0.37109375,0.2999442219734192,0.0078125,0.3125,0.578125,0.2999442219734192,0.0,0.3125,0.9375 182,model.layers.26.self_attn.q_proj,tx.26.attn.q,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.23583984375,0.30029296875,0.35693359375,0.2998046875,0.0,0.3125,0.5390625,0.2998046875,0.0,0.3125,0.875 183,model.layers.26.self_attn.k_proj,tx.26.attn.k,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.22998046875,0.30029296875,0.365234375,0.2998046875,0.0,0.3125,0.765625,0.2998046875,0.0,0.3125,0.8125 184,model.layers.26.self_attn.v_proj,tx.26.attn.v,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.23681640625,0.29931640625,0.38134765625,0.2998046875,0.0,0.3046875,1.0,0.2998046875,0.0,0.3125,0.875 185,model.layers.26.self_attn.o_proj,tx.26.attn.o,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.111328125,0.259765625,0.65185546875,0.2998046875,0.0,0.2578125,0.8046875,0.2998046875,0.0,0.25,1.0 186,model.layers.26.mlp.gate_proj,tx.26.mlp.gate,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.24951171875,0.2998046875,0.34375,0.2998046875,0.0,0.3046875,0.640625,0.2998046875,0.0,0.3125,0.875 187,model.layers.26.mlp.up_proj,tx.26.mlp.up,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.2451171875,0.2998046875,0.3505859375,0.2998046875,0.0078125,0.296875,0.625,0.2998046875,0.0,0.3125,0.875 188,model.layers.26.mlp.down_proj,tx.26.mlp.down,Linear,weight,"[4096, 14336]",58720256,41107456,0.2999441623687744,"(128, 16)",32 x 896,28672,0.2999442219734192,0.21142578125,0.30078125,0.37060546875,0.2999442219734192,0.0,0.3125,0.6171875,0.2999442219734192,0.0,0.3125,0.9375 189,model.layers.27.self_attn.q_proj,tx.27.attn.q,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.23486328125,0.30029296875,0.3740234375,0.2998046875,0.0,0.3125,1.0,0.2998046875,0.0,0.3125,0.875 190,model.layers.27.self_attn.k_proj,tx.27.attn.k,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.2353515625,0.30029296875,0.37451171875,0.2998046875,0.0,0.3125,1.0,0.2998046875,0.0,0.3125,0.8125 191,model.layers.27.self_attn.v_proj,tx.27.attn.v,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.23779296875,0.2998046875,0.37548828125,0.2998046875,0.0078125,0.3046875,1.0,0.2998046875,0.0,0.3125,0.8125 192,model.layers.27.self_attn.o_proj,tx.27.attn.o,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.10791015625,0.27587890625,0.61572265625,0.2998046875,0.0,0.265625,0.796875,0.2998046875,0.0,0.25,1.0 193,model.layers.27.mlp.gate_proj,tx.27.mlp.gate,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.2470703125,0.2998046875,0.3505859375,0.2998046875,0.0,0.3046875,0.609375,0.2998046875,0.0,0.3125,0.9375 194,model.layers.27.mlp.up_proj,tx.27.mlp.up,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.25341796875,0.2998046875,0.34619140625,0.2998046875,0.0,0.296875,0.671875,0.2998046875,0.0,0.3125,0.9375 195,model.layers.27.mlp.down_proj,tx.27.mlp.down,Linear,weight,"[4096, 14336]",58720256,41107456,0.2999441623687744,"(128, 16)",32 x 896,28672,0.2999442219734192,0.21826171875,0.30029296875,0.36962890625,0.2999442219734192,0.0,0.3125,0.546875,0.2999442219734192,0.0,0.3125,0.9375 196,model.layers.28.self_attn.q_proj,tx.28.attn.q,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.22216796875,0.30078125,0.3564453125,0.2998046875,0.0,0.3125,0.5234375,0.2998046875,0.0,0.3125,0.875 197,model.layers.28.self_attn.k_proj,tx.28.attn.k,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.232421875,0.2998046875,0.35498046875,0.2998046875,0.0,0.3125,0.78125,0.2998046875,0.0,0.3125,0.8125 198,model.layers.28.self_attn.v_proj,tx.28.attn.v,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.2470703125,0.2998046875,0.36865234375,0.2998046875,0.015625,0.3046875,1.0,0.2998046875,0.0,0.3125,0.8125 199,model.layers.28.self_attn.o_proj,tx.28.attn.o,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.09423828125,0.2880859375,0.67041015625,0.2998046875,0.015625,0.2890625,0.7734375,0.2998046875,0.0,0.3125,1.0 200,model.layers.28.mlp.gate_proj,tx.28.mlp.gate,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.24365234375,0.30029296875,0.3466796875,0.2998046875,0.0,0.3046875,0.609375,0.2998046875,0.0,0.3125,0.875 201,model.layers.28.mlp.up_proj,tx.28.mlp.up,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.24609375,0.2998046875,0.3515625,0.2998046875,0.0078125,0.3046875,0.59375,0.2998046875,0.0,0.3125,0.875 202,model.layers.28.mlp.down_proj,tx.28.mlp.down,Linear,weight,"[4096, 14336]",58720256,41107456,0.2999441623687744,"(128, 16)",32 x 896,28672,0.2999442219734192,0.208984375,0.30078125,0.3759765625,0.2999442219734192,0.0078125,0.3203125,0.5703125,0.2999442219734192,0.0,0.3125,0.875 203,model.layers.29.self_attn.q_proj,tx.29.attn.q,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.22802734375,0.30029296875,0.38525390625,0.2998046875,0.0,0.3046875,1.0,0.2998046875,0.0,0.3125,0.875 204,model.layers.29.self_attn.k_proj,tx.29.attn.k,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.22705078125,0.30029296875,0.36474609375,0.2998046875,0.0,0.3046875,1.0,0.2998046875,0.0,0.3125,0.875 205,model.layers.29.self_attn.v_proj,tx.29.attn.v,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.2412109375,0.29931640625,0.3623046875,0.2998046875,0.0078125,0.3046875,1.0,0.2998046875,0.0,0.3125,0.875 206,model.layers.29.self_attn.o_proj,tx.29.attn.o,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.0693359375,0.330078125,0.55615234375,0.2998046875,0.0,0.3046875,0.703125,0.2998046875,0.0,0.3125,1.0 207,model.layers.29.mlp.gate_proj,tx.29.mlp.gate,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.24462890625,0.2998046875,0.34423828125,0.2998046875,0.0,0.3046875,0.6171875,0.2998046875,0.0,0.3125,0.875 208,model.layers.29.mlp.up_proj,tx.29.mlp.up,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.24560546875,0.30029296875,0.34912109375,0.2998046875,0.0078125,0.3046875,0.625,0.2998046875,0.0,0.3125,0.875 209,model.layers.29.mlp.down_proj,tx.29.mlp.down,Linear,weight,"[4096, 14336]",58720256,41107456,0.2999441623687744,"(128, 16)",32 x 896,28672,0.2999442219734192,0.2236328125,0.30078125,0.37548828125,0.2999442219734192,0.0,0.3125,0.59375,0.2999442219734192,0.0,0.3125,0.875 210,model.layers.30.self_attn.q_proj,tx.30.attn.q,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.2177734375,0.30029296875,0.3544921875,0.2998046875,0.0,0.3125,0.5390625,0.2998046875,0.0,0.3125,0.875 211,model.layers.30.self_attn.k_proj,tx.30.attn.k,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.22509765625,0.30126953125,0.3603515625,0.2998046875,0.0,0.3125,0.78125,0.2998046875,0.0,0.3125,0.875 212,model.layers.30.self_attn.v_proj,tx.30.attn.v,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.22802734375,0.2998046875,0.3837890625,0.2998046875,0.0078125,0.3046875,1.0,0.2998046875,0.0,0.3125,0.875 213,model.layers.30.self_attn.o_proj,tx.30.attn.o,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.0869140625,0.271484375,0.8271484375,0.2998046875,0.0234375,0.2734375,0.9453125,0.2998046875,0.0,0.25,1.0 214,model.layers.30.mlp.gate_proj,tx.30.mlp.gate,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.25048828125,0.30029296875,0.35205078125,0.2998046875,0.0078125,0.3046875,0.703125,0.2998046875,0.0,0.3125,0.9375 215,model.layers.30.mlp.up_proj,tx.30.mlp.up,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.25048828125,0.30029296875,0.35009765625,0.2998046875,0.0,0.3046875,0.6640625,0.2998046875,0.0,0.3125,0.9375 216,model.layers.30.mlp.down_proj,tx.30.mlp.down,Linear,weight,"[4096, 14336]",58720256,41107456,0.2999441623687744,"(128, 16)",32 x 896,28672,0.2999442219734192,0.21142578125,0.30078125,0.38427734375,0.2999442219734192,0.0,0.3203125,0.65625,0.2999442219734192,0.0,0.3125,0.875 217,model.layers.31.self_attn.q_proj,tx.31.attn.q,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.21826171875,0.30029296875,0.3603515625,0.2998046875,0.0,0.3046875,0.8203125,0.2998046875,0.0,0.3125,0.9375 218,model.layers.31.self_attn.k_proj,tx.31.attn.k,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.22607421875,0.2998046875,0.3525390625,0.2998046875,0.0,0.3125,0.8359375,0.2998046875,0.0,0.3125,0.8125 219,model.layers.31.self_attn.v_proj,tx.31.attn.v,Linear,weight,"[1024, 4096]",4194304,2936832,0.2998046875,"(128, 16)",8 x 256,2048,0.2998046875,0.2138671875,0.2998046875,0.36279296875,0.2998046875,0.0078125,0.3046875,1.0,0.2998046875,0.0,0.3125,0.875 220,model.layers.31.self_attn.o_proj,tx.31.attn.o,Linear,weight,"[4096, 4096]",16777216,11747328,0.2998046875,"(128, 16)",32 x 256,8192,0.2998046875,0.0390625,0.26416015625,0.65380859375,0.2998046875,0.0,0.2734375,0.828125,0.2998046875,0.0,0.25,1.0 221,model.layers.31.mlp.gate_proj,tx.31.mlp.gate,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.25537109375,0.2998046875,0.35107421875,0.2998046875,0.0234375,0.3046875,0.7421875,0.2998046875,0.0,0.3125,0.875 222,model.layers.31.mlp.up_proj,tx.31.mlp.up,Linear,weight,"[14336, 4096]",58720256,41115648,0.2998046278953552,"(128, 16)",112 x 256,28672,0.2998046875,0.24951171875,0.2998046875,0.3466796875,0.2998046875,0.015625,0.3046875,0.6875,0.2998046875,0.0,0.3125,0.875 223,model.layers.31.mlp.down_proj,tx.31.mlp.down,Linear,weight,"[4096, 14336]",58720256,41107456,0.2999441623687744,"(128, 16)",32 x 896,28672,0.2999442219734192,0.18701171875,0.2998046875,0.404296875,0.2999442219734192,0.0,0.328125,0.765625,0.2999442219734192,0.0,0.3125,0.875 224,lm_head,lm_head,Linear,weight,"[128256, 4096]",525336576,525336576,0.0,"(128, 16)",1002 x 256,256512,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0