row,layer_id,short_id,layer_type,param_type,shape,nparam,nnz,sparsity,tile_shape,n_tile,n_tile_total,tile_avg,tile_min,tile_med,tile_max,col_avg,col_min,col_med,col_max,row_avg,row_min,row_med,row_max 0,model.layers.0.self_attn.q_proj,tx.0.attn.q,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.02099609375,0.189453125,0.5751953125,0.199951171875,0.0,0.0078125,1.0,0.199951171875,0.0,0.1875,0.75 1,model.layers.0.self_attn.k_proj,tx.0.attn.k,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.0361328125,0.18701171875,0.56884765625,0.199951171875,0.0,0.0078125,1.0,0.199951171875,0.0,0.1875,0.6875 2,model.layers.0.self_attn.v_proj,tx.0.attn.v,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.02880859375,0.19189453125,0.53271484375,0.199951171875,0.0,0.015625,1.0,0.199951171875,0.0,0.1875,0.6875 3,model.layers.0.self_attn.o_proj,tx.0.attn.o,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.01513671875,0.13525390625,0.8046875,0.199951171875,0.0,0.125,0.9453125,0.199951171875,0.0,0.125,1.0 4,model.layers.0.mlp.gate_proj,tx.0.mlp.gate,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.15625,0.197265625,0.31494140625,0.1999511867761612,0.0078125,0.1953125,1.0,0.1999511867761612,0.0,0.1875,0.8125 5,model.layers.0.mlp.up_proj,tx.0.mlp.up,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.15771484375,0.197265625,0.318359375,0.1999511867761612,0.015625,0.1953125,1.0,0.1999511867761612,0.0,0.1875,0.8125 6,model.layers.0.mlp.down_proj,tx.0.mlp.down,Linear,weight,"[4096, 14336]",58720256,46977024,0.1999860405921936,"(128, 16)",32 x 896,28672,0.1999860554933548,0.12841796875,0.2001953125,0.26318359375,0.1999860554933548,0.0,0.1953125,0.4765625,0.1999860554933548,0.0,0.1875,0.8125 7,model.layers.1.self_attn.q_proj,tx.1.attn.q,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.11181640625,0.19677734375,0.39453125,0.199951171875,0.0,0.1953125,1.0,0.199951171875,0.0,0.1875,0.75 8,model.layers.1.self_attn.k_proj,tx.1.attn.k,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.10791015625,0.197265625,0.38427734375,0.199951171875,0.0,0.203125,1.0,0.199951171875,0.0,0.1875,0.6875 9,model.layers.1.self_attn.v_proj,tx.1.attn.v,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.11328125,0.1953125,0.36669921875,0.199951171875,0.0,0.203125,1.0,0.199951171875,0.0,0.1875,0.6875 10,model.layers.1.self_attn.o_proj,tx.1.attn.o,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.07080078125,0.17822265625,0.61328125,0.199951171875,0.0,0.1640625,0.859375,0.199951171875,0.0,0.1875,1.0 11,model.layers.1.mlp.gate_proj,tx.1.mlp.gate,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.150390625,0.197265625,0.30810546875,0.1999511867761612,0.015625,0.1953125,1.0,0.1999511867761612,0.0,0.1875,0.8125 12,model.layers.1.mlp.up_proj,tx.1.mlp.up,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.1591796875,0.197265625,0.31396484375,0.1999511867761612,0.0234375,0.1953125,1.0,0.1999511867761612,0.0,0.1875,0.75 13,model.layers.1.mlp.down_proj,tx.1.mlp.down,Linear,weight,"[4096, 14336]",58720256,46977024,0.1999860405921936,"(128, 16)",32 x 896,28672,0.1999860554933548,0.14453125,0.2001953125,0.2685546875,0.1999860554933548,0.0,0.203125,0.4296875,0.1999860554933548,0.0,0.1875,0.75 14,model.layers.2.self_attn.q_proj,tx.2.attn.q,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.1279296875,0.19921875,0.31005859375,0.199951171875,0.0,0.2109375,1.0,0.199951171875,0.0,0.1875,0.8125 15,model.layers.2.self_attn.k_proj,tx.2.attn.k,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.134765625,0.19970703125,0.31103515625,0.199951171875,0.0,0.2109375,1.0,0.199951171875,0.0,0.1875,0.6875 16,model.layers.2.self_attn.v_proj,tx.2.attn.v,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.150390625,0.19873046875,0.3037109375,0.199951171875,0.0,0.203125,1.0,0.199951171875,0.0,0.1875,0.6875 17,model.layers.2.self_attn.o_proj,tx.2.attn.o,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.07861328125,0.17041015625,0.5810546875,0.199951171875,0.0,0.171875,0.765625,0.199951171875,0.0,0.1875,1.0 18,model.layers.2.mlp.gate_proj,tx.2.mlp.gate,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.15771484375,0.197265625,0.3154296875,0.1999511867761612,0.0234375,0.1953125,1.0,0.1999511867761612,0.0,0.1875,0.8125 19,model.layers.2.mlp.up_proj,tx.2.mlp.up,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.15673828125,0.197265625,0.3212890625,0.1999511867761612,0.03125,0.1953125,1.0,0.1999511867761612,0.0,0.1875,0.8125 20,model.layers.2.mlp.down_proj,tx.2.mlp.down,Linear,weight,"[4096, 14336]",58720256,46977024,0.1999860405921936,"(128, 16)",32 x 896,28672,0.1999860554933548,0.13916015625,0.2001953125,0.26025390625,0.1999860554933548,0.0,0.203125,0.5,0.1999860554933548,0.0,0.1875,0.75 21,model.layers.3.self_attn.q_proj,tx.3.attn.q,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.1474609375,0.2001953125,0.28955078125,0.199951171875,0.0,0.203125,1.0,0.199951171875,0.0,0.1875,0.8125 22,model.layers.3.self_attn.k_proj,tx.3.attn.k,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.14306640625,0.19970703125,0.27294921875,0.199951171875,0.0,0.203125,1.0,0.199951171875,0.0,0.1875,0.75 23,model.layers.3.self_attn.v_proj,tx.3.attn.v,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.15673828125,0.19921875,0.28173828125,0.199951171875,0.0,0.203125,1.0,0.199951171875,0.0,0.1875,0.75 24,model.layers.3.self_attn.o_proj,tx.3.attn.o,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.099609375,0.1904296875,0.3515625,0.199951171875,0.0,0.1953125,0.6015625,0.199951171875,0.0,0.1875,0.8125 25,model.layers.3.mlp.gate_proj,tx.3.mlp.gate,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.16064453125,0.1982421875,0.31201171875,0.1999511867761612,0.0078125,0.1953125,1.0,0.1999511867761612,0.0,0.1875,0.75 26,model.layers.3.mlp.up_proj,tx.3.mlp.up,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.15869140625,0.1982421875,0.31494140625,0.1999511867761612,0.03125,0.1953125,1.0,0.1999511867761612,0.0,0.1875,0.8125 27,model.layers.3.mlp.down_proj,tx.3.mlp.down,Linear,weight,"[4096, 14336]",58720256,46977024,0.1999860405921936,"(128, 16)",32 x 896,28672,0.1999860554933548,0.146484375,0.19970703125,0.25634765625,0.1999860554933548,0.0,0.203125,0.4609375,0.1999860554933548,0.0,0.1875,0.8125 28,model.layers.4.self_attn.q_proj,tx.4.attn.q,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.13671875,0.2001953125,0.271484375,0.199951171875,0.0,0.203125,1.0,0.199951171875,0.0,0.1875,0.75 29,model.layers.4.self_attn.k_proj,tx.4.attn.k,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.1435546875,0.2001953125,0.2734375,0.199951171875,0.0,0.2109375,1.0,0.199951171875,0.0,0.1875,0.75 30,model.layers.4.self_attn.v_proj,tx.4.attn.v,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.15283203125,0.19921875,0.27734375,0.199951171875,0.0,0.203125,1.0,0.199951171875,0.0,0.1875,0.75 31,model.layers.4.self_attn.o_proj,tx.4.attn.o,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.087890625,0.17578125,0.5419921875,0.199951171875,0.0,0.1796875,0.7265625,0.199951171875,0.0,0.1875,0.9375 32,model.layers.4.mlp.gate_proj,tx.4.mlp.gate,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.15478515625,0.19970703125,0.26953125,0.1999511867761612,0.0,0.203125,1.0,0.1999511867761612,0.0,0.1875,0.75 33,model.layers.4.mlp.up_proj,tx.4.mlp.up,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.1572265625,0.19970703125,0.27783203125,0.1999511867761612,0.0078125,0.203125,1.0,0.1999511867761612,0.0,0.1875,0.75 34,model.layers.4.mlp.down_proj,tx.4.mlp.down,Linear,weight,"[4096, 14336]",58720256,46977024,0.1999860405921936,"(128, 16)",32 x 896,28672,0.1999860554933548,0.1513671875,0.19970703125,0.25732421875,0.1999860554933548,0.0,0.1953125,0.6484375,0.1999860554933548,0.0,0.1875,0.8125 35,model.layers.5.self_attn.q_proj,tx.5.attn.q,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.13818359375,0.2001953125,0.25634765625,0.199951171875,0.0,0.203125,0.4921875,0.199951171875,0.0,0.1875,0.75 36,model.layers.5.self_attn.k_proj,tx.5.attn.k,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.13134765625,0.19970703125,0.26318359375,0.199951171875,0.0,0.2109375,0.6171875,0.199951171875,0.0,0.1875,0.75 37,model.layers.5.self_attn.v_proj,tx.5.attn.v,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.15380859375,0.19970703125,0.275390625,0.199951171875,0.0078125,0.203125,0.9921875,0.199951171875,0.0,0.1875,0.6875 38,model.layers.5.self_attn.o_proj,tx.5.attn.o,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.06640625,0.16162109375,0.48193359375,0.199951171875,0.0,0.171875,0.6796875,0.199951171875,0.0,0.1875,0.9375 39,model.layers.5.mlp.gate_proj,tx.5.mlp.gate,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.15380859375,0.19970703125,0.2666015625,0.1999511867761612,0.0,0.203125,1.0,0.1999511867761612,0.0,0.1875,0.75 40,model.layers.5.mlp.up_proj,tx.5.mlp.up,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.16015625,0.19970703125,0.2705078125,0.1999511867761612,0.015625,0.203125,1.0,0.1999511867761612,0.0,0.1875,0.8125 41,model.layers.5.mlp.down_proj,tx.5.mlp.down,Linear,weight,"[4096, 14336]",58720256,46977024,0.1999860405921936,"(128, 16)",32 x 896,28672,0.1999860554933548,0.15380859375,0.19970703125,0.2666015625,0.1999860554933548,0.0,0.1953125,0.53125,0.1999860554933548,0.0,0.1875,0.75 42,model.layers.6.self_attn.q_proj,tx.6.attn.q,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.1494140625,0.2001953125,0.24560546875,0.199951171875,0.0,0.203125,0.515625,0.199951171875,0.0,0.1875,0.75 43,model.layers.6.self_attn.k_proj,tx.6.attn.k,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.14990234375,0.2001953125,0.24853515625,0.199951171875,0.0,0.203125,0.6484375,0.199951171875,0.0,0.1875,0.75 44,model.layers.6.self_attn.v_proj,tx.6.attn.v,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.1484375,0.19921875,0.27392578125,0.199951171875,0.0,0.203125,1.0,0.199951171875,0.0,0.1875,0.75 45,model.layers.6.self_attn.o_proj,tx.6.attn.o,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.08984375,0.18798828125,0.3974609375,0.199951171875,0.0,0.1875,0.5859375,0.199951171875,0.0,0.1875,0.8125 46,model.layers.6.mlp.gate_proj,tx.6.mlp.gate,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.15771484375,0.19970703125,0.27001953125,0.1999511867761612,0.0,0.203125,1.0,0.1999511867761612,0.0,0.1875,0.8125 47,model.layers.6.mlp.up_proj,tx.6.mlp.up,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.15966796875,0.19970703125,0.2744140625,0.1999511867761612,0.015625,0.203125,1.0,0.1999511867761612,0.0,0.1875,0.8125 48,model.layers.6.mlp.down_proj,tx.6.mlp.down,Linear,weight,"[4096, 14336]",58720256,46977024,0.1999860405921936,"(128, 16)",32 x 896,28672,0.1999860554933548,0.1533203125,0.19970703125,0.255859375,0.1999860554933548,0.0,0.1953125,0.546875,0.1999860554933548,0.0,0.1875,0.75 49,model.layers.7.self_attn.q_proj,tx.7.attn.q,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.15087890625,0.2001953125,0.24560546875,0.199951171875,0.0,0.203125,0.4453125,0.199951171875,0.0,0.1875,0.8125 50,model.layers.7.self_attn.k_proj,tx.7.attn.k,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.14990234375,0.2001953125,0.25634765625,0.199951171875,0.0,0.203125,0.640625,0.199951171875,0.0,0.1875,0.75 51,model.layers.7.self_attn.v_proj,tx.7.attn.v,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.16015625,0.19921875,0.2705078125,0.199951171875,0.0078125,0.203125,0.9921875,0.199951171875,0.0,0.1875,0.75 52,model.layers.7.self_attn.o_proj,tx.7.attn.o,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.11865234375,0.1962890625,0.31201171875,0.199951171875,0.0,0.203125,0.515625,0.199951171875,0.0,0.1875,0.75 53,model.layers.7.mlp.gate_proj,tx.7.mlp.gate,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.15966796875,0.2001953125,0.2529296875,0.1999511867761612,0.0,0.203125,0.3671875,0.1999511867761612,0.0,0.1875,0.75 54,model.layers.7.mlp.up_proj,tx.7.mlp.up,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.15869140625,0.2001953125,0.23876953125,0.1999511867761612,0.015625,0.203125,0.390625,0.1999511867761612,0.0,0.1875,0.75 55,model.layers.7.mlp.down_proj,tx.7.mlp.down,Linear,weight,"[4096, 14336]",58720256,46977024,0.1999860405921936,"(128, 16)",32 x 896,28672,0.1999860554933548,0.14990234375,0.19970703125,0.25732421875,0.1999860554933548,0.0,0.1953125,0.5546875,0.1999860554933548,0.0,0.1875,0.75 56,model.layers.8.self_attn.q_proj,tx.8.attn.q,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.1396484375,0.2001953125,0.25048828125,0.199951171875,0.0,0.203125,0.4921875,0.199951171875,0.0,0.1875,0.75 57,model.layers.8.self_attn.k_proj,tx.8.attn.k,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.1533203125,0.19970703125,0.248046875,0.199951171875,0.0,0.203125,0.515625,0.199951171875,0.0,0.1875,0.6875 58,model.layers.8.self_attn.v_proj,tx.8.attn.v,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.15625,0.19970703125,0.2744140625,0.199951171875,0.0,0.203125,0.9921875,0.199951171875,0.0,0.1875,0.75 59,model.layers.8.self_attn.o_proj,tx.8.attn.o,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.1005859375,0.19384765625,0.3740234375,0.199951171875,0.0,0.1953125,0.5546875,0.199951171875,0.0,0.1875,0.875 60,model.layers.8.mlp.gate_proj,tx.8.mlp.gate,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.15869140625,0.19970703125,0.26806640625,0.1999511867761612,0.0,0.203125,1.0,0.1999511867761612,0.0,0.1875,0.8125 61,model.layers.8.mlp.up_proj,tx.8.mlp.up,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.15625,0.19970703125,0.2744140625,0.1999511867761612,0.015625,0.203125,1.0,0.1999511867761612,0.0,0.1875,0.8125 62,model.layers.8.mlp.down_proj,tx.8.mlp.down,Linear,weight,"[4096, 14336]",58720256,46977024,0.1999860405921936,"(128, 16)",32 x 896,28672,0.1999860554933548,0.14501953125,0.19970703125,0.25537109375,0.1999860554933548,0.0078125,0.1953125,0.5546875,0.1999860554933548,0.0,0.1875,0.8125 63,model.layers.9.self_attn.q_proj,tx.9.attn.q,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.15283203125,0.19970703125,0.24560546875,0.199951171875,0.0,0.203125,0.46875,0.199951171875,0.0,0.1875,0.75 64,model.layers.9.self_attn.k_proj,tx.9.attn.k,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.15185546875,0.2001953125,0.23974609375,0.199951171875,0.0,0.203125,0.5390625,0.199951171875,0.0,0.1875,0.6875 65,model.layers.9.self_attn.v_proj,tx.9.attn.v,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.1611328125,0.19921875,0.26318359375,0.199951171875,0.0,0.1953125,0.9921875,0.199951171875,0.0,0.1875,0.75 66,model.layers.9.self_attn.o_proj,tx.9.attn.o,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.0986328125,0.19287109375,0.39111328125,0.199951171875,0.0,0.1953125,0.5546875,0.199951171875,0.0,0.1875,0.8125 67,model.layers.9.mlp.gate_proj,tx.9.mlp.gate,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.158203125,0.2001953125,0.23974609375,0.1999511867761612,0.0,0.203125,0.4140625,0.1999511867761612,0.0,0.1875,0.8125 68,model.layers.9.mlp.up_proj,tx.9.mlp.up,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.15966796875,0.2001953125,0.2431640625,0.1999511867761612,0.0078125,0.203125,0.390625,0.1999511867761612,0.0,0.1875,0.75 69,model.layers.9.mlp.down_proj,tx.9.mlp.down,Linear,weight,"[4096, 14336]",58720256,46977024,0.1999860405921936,"(128, 16)",32 x 896,28672,0.1999860554933548,0.140625,0.2001953125,0.24658203125,0.1999860554933548,0.0,0.1953125,0.5078125,0.1999860554933548,0.0,0.1875,0.8125 70,model.layers.10.self_attn.q_proj,tx.10.attn.q,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.146484375,0.2001953125,0.2490234375,0.199951171875,0.0,0.203125,0.4453125,0.199951171875,0.0,0.1875,0.75 71,model.layers.10.self_attn.k_proj,tx.10.attn.k,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.1484375,0.2001953125,0.2412109375,0.199951171875,0.0,0.203125,0.546875,0.199951171875,0.0,0.1875,0.6875 72,model.layers.10.self_attn.v_proj,tx.10.attn.v,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.150390625,0.19970703125,0.255859375,0.199951171875,0.0,0.203125,0.9921875,0.199951171875,0.0,0.1875,0.75 73,model.layers.10.self_attn.o_proj,tx.10.attn.o,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.0849609375,0.1787109375,0.43212890625,0.199951171875,0.0,0.1875,0.609375,0.199951171875,0.0,0.1875,0.875 74,model.layers.10.mlp.gate_proj,tx.10.mlp.gate,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.1611328125,0.2001953125,0.2412109375,0.1999511867761612,0.0,0.203125,0.3828125,0.1999511867761612,0.0,0.1875,0.8125 75,model.layers.10.mlp.up_proj,tx.10.mlp.up,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.1640625,0.2001953125,0.23681640625,0.1999511867761612,0.0078125,0.203125,0.3984375,0.1999511867761612,0.0,0.1875,0.75 76,model.layers.10.mlp.down_proj,tx.10.mlp.down,Linear,weight,"[4096, 14336]",58720256,46977024,0.1999860405921936,"(128, 16)",32 x 896,28672,0.1999860554933548,0.14599609375,0.2001953125,0.2548828125,0.1999860554933548,0.0,0.203125,0.46875,0.1999860554933548,0.0,0.1875,0.8125 77,model.layers.11.self_attn.q_proj,tx.11.attn.q,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.1484375,0.2001953125,0.2431640625,0.199951171875,0.0,0.203125,0.46875,0.199951171875,0.0,0.1875,0.75 78,model.layers.11.self_attn.k_proj,tx.11.attn.k,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.1572265625,0.19970703125,0.24755859375,0.199951171875,0.0,0.203125,0.6484375,0.199951171875,0.0,0.1875,0.75 79,model.layers.11.self_attn.v_proj,tx.11.attn.v,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.1611328125,0.19970703125,0.25341796875,0.199951171875,0.015625,0.1953125,0.9921875,0.199951171875,0.0,0.1875,0.8125 80,model.layers.11.self_attn.o_proj,tx.11.attn.o,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.1064453125,0.1865234375,0.42578125,0.199951171875,0.0,0.1953125,0.578125,0.199951171875,0.0,0.1875,0.9375 81,model.layers.11.mlp.gate_proj,tx.11.mlp.gate,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.1484375,0.2001953125,0.240234375,0.1999511867761612,0.0,0.203125,0.390625,0.1999511867761612,0.0,0.1875,0.8125 82,model.layers.11.mlp.up_proj,tx.11.mlp.up,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.15966796875,0.2001953125,0.23974609375,0.1999511867761612,0.0,0.203125,0.4140625,0.1999511867761612,0.0,0.1875,0.8125 83,model.layers.11.mlp.down_proj,tx.11.mlp.down,Linear,weight,"[4096, 14336]",58720256,46977024,0.1999860405921936,"(128, 16)",32 x 896,28672,0.1999860554933548,0.1494140625,0.19970703125,0.24951171875,0.1999860554933548,0.0,0.203125,0.6015625,0.1999860554933548,0.0,0.1875,0.75 84,model.layers.12.self_attn.q_proj,tx.12.attn.q,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.1474609375,0.2001953125,0.24267578125,0.199951171875,0.0,0.203125,0.4609375,0.199951171875,0.0,0.1875,0.75 85,model.layers.12.self_attn.k_proj,tx.12.attn.k,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.1484375,0.2001953125,0.2431640625,0.199951171875,0.0,0.203125,0.6015625,0.199951171875,0.0,0.1875,0.6875 86,model.layers.12.self_attn.v_proj,tx.12.attn.v,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.1630859375,0.19970703125,0.26416015625,0.199951171875,0.0078125,0.1953125,0.9921875,0.199951171875,0.0,0.1875,0.75 87,model.layers.12.self_attn.o_proj,tx.12.attn.o,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.0771484375,0.2001953125,0.32080078125,0.199951171875,0.0,0.203125,0.4921875,0.199951171875,0.0,0.1875,0.8125 88,model.layers.12.mlp.gate_proj,tx.12.mlp.gate,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.15771484375,0.2001953125,0.23876953125,0.1999511867761612,0.0,0.203125,0.375,0.1999511867761612,0.0,0.1875,0.75 89,model.layers.12.mlp.up_proj,tx.12.mlp.up,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.15576171875,0.2001953125,0.23876953125,0.1999511867761612,0.0078125,0.203125,0.3984375,0.1999511867761612,0.0,0.1875,0.75 90,model.layers.12.mlp.down_proj,tx.12.mlp.down,Linear,weight,"[4096, 14336]",58720256,46977024,0.1999860405921936,"(128, 16)",32 x 896,28672,0.1999860554933548,0.14501953125,0.19970703125,0.25341796875,0.1999860554933548,0.0,0.203125,0.484375,0.1999860554933548,0.0,0.1875,0.75 91,model.layers.13.self_attn.q_proj,tx.13.attn.q,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.15234375,0.2001953125,0.2490234375,0.199951171875,0.0,0.203125,0.4609375,0.199951171875,0.0,0.1875,0.75 92,model.layers.13.self_attn.k_proj,tx.13.attn.k,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.146484375,0.19970703125,0.24365234375,0.199951171875,0.0,0.203125,0.6640625,0.199951171875,0.0,0.1875,0.6875 93,model.layers.13.self_attn.v_proj,tx.13.attn.v,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.16357421875,0.19970703125,0.26904296875,0.199951171875,0.015625,0.203125,0.9921875,0.199951171875,0.0,0.1875,0.6875 94,model.layers.13.self_attn.o_proj,tx.13.attn.o,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.095703125,0.193359375,0.3701171875,0.199951171875,0.0,0.1953125,0.5234375,0.199951171875,0.0,0.1875,0.8125 95,model.layers.13.mlp.gate_proj,tx.13.mlp.gate,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.15185546875,0.2001953125,0.2392578125,0.1999511867761612,0.0,0.203125,0.3984375,0.1999511867761612,0.0,0.1875,0.75 96,model.layers.13.mlp.up_proj,tx.13.mlp.up,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.15771484375,0.2001953125,0.23828125,0.1999511867761612,0.0078125,0.203125,0.390625,0.1999511867761612,0.0,0.1875,0.75 97,model.layers.13.mlp.down_proj,tx.13.mlp.down,Linear,weight,"[4096, 14336]",58720256,46977024,0.1999860405921936,"(128, 16)",32 x 896,28672,0.1999860554933548,0.150390625,0.19970703125,0.26416015625,0.1999860554933548,0.0,0.203125,0.546875,0.1999860554933548,0.0,0.1875,0.8125 98,model.layers.14.self_attn.q_proj,tx.14.attn.q,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.14892578125,0.2001953125,0.24365234375,0.199951171875,0.0,0.203125,0.4609375,0.199951171875,0.0,0.1875,0.75 99,model.layers.14.self_attn.k_proj,tx.14.attn.k,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.14794921875,0.19970703125,0.24658203125,0.199951171875,0.0,0.203125,0.6953125,0.199951171875,0.0,0.1875,0.6875 100,model.layers.14.self_attn.v_proj,tx.14.attn.v,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.16015625,0.19970703125,0.2705078125,0.199951171875,0.0,0.203125,0.9921875,0.199951171875,0.0,0.1875,0.75 101,model.layers.14.self_attn.o_proj,tx.14.attn.o,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.10009765625,0.19189453125,0.41015625,0.199951171875,0.0,0.1953125,0.5703125,0.199951171875,0.0,0.1875,0.875 102,model.layers.14.mlp.gate_proj,tx.14.mlp.gate,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.1552734375,0.2001953125,0.24072265625,0.1999511867761612,0.0,0.203125,0.390625,0.1999511867761612,0.0,0.1875,0.75 103,model.layers.14.mlp.up_proj,tx.14.mlp.up,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.16259765625,0.19970703125,0.23486328125,0.1999511867761612,0.0,0.203125,0.40625,0.1999511867761612,0.0,0.1875,0.75 104,model.layers.14.mlp.down_proj,tx.14.mlp.down,Linear,weight,"[4096, 14336]",58720256,46977024,0.1999860405921936,"(128, 16)",32 x 896,28672,0.1999860554933548,0.1318359375,0.2001953125,0.2607421875,0.1999860554933548,0.0078125,0.1953125,0.5078125,0.1999860554933548,0.0,0.1875,0.75 105,model.layers.15.self_attn.q_proj,tx.15.attn.q,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.154296875,0.2001953125,0.24609375,0.199951171875,0.0,0.203125,0.4453125,0.199951171875,0.0,0.1875,0.75 106,model.layers.15.self_attn.k_proj,tx.15.attn.k,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.15087890625,0.2001953125,0.25244140625,0.199951171875,0.0,0.203125,0.5859375,0.199951171875,0.0,0.1875,0.75 107,model.layers.15.self_attn.v_proj,tx.15.attn.v,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.150390625,0.19970703125,0.27294921875,0.199951171875,0.0078125,0.203125,0.9921875,0.199951171875,0.0,0.1875,0.6875 108,model.layers.15.self_attn.o_proj,tx.15.attn.o,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.07568359375,0.1767578125,0.453125,0.199951171875,0.0,0.1796875,0.6015625,0.199951171875,0.0,0.1875,0.9375 109,model.layers.15.mlp.gate_proj,tx.15.mlp.gate,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.16015625,0.2001953125,0.24267578125,0.1999511867761612,0.0,0.203125,0.390625,0.1999511867761612,0.0,0.1875,0.8125 110,model.layers.15.mlp.up_proj,tx.15.mlp.up,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.15625,0.19970703125,0.2373046875,0.1999511867761612,0.0,0.203125,0.3828125,0.1999511867761612,0.0,0.1875,0.75 111,model.layers.15.mlp.down_proj,tx.15.mlp.down,Linear,weight,"[4096, 14336]",58720256,46977024,0.1999860405921936,"(128, 16)",32 x 896,28672,0.1999860554933548,0.14794921875,0.19970703125,0.251953125,0.1999860554933548,0.0,0.1953125,0.53125,0.1999860554933548,0.0,0.1875,0.75 112,model.layers.16.self_attn.q_proj,tx.16.attn.q,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.15576171875,0.2001953125,0.2421875,0.199951171875,0.0,0.203125,0.4296875,0.199951171875,0.0,0.1875,0.75 113,model.layers.16.self_attn.k_proj,tx.16.attn.k,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.1533203125,0.2001953125,0.240234375,0.199951171875,0.0,0.203125,0.578125,0.199951171875,0.0,0.1875,0.6875 114,model.layers.16.self_attn.v_proj,tx.16.attn.v,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.15283203125,0.19921875,0.26806640625,0.199951171875,0.0,0.203125,0.9921875,0.199951171875,0.0,0.1875,0.8125 115,model.layers.16.self_attn.o_proj,tx.16.attn.o,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.076171875,0.18798828125,0.4033203125,0.199951171875,0.0,0.1875,0.546875,0.199951171875,0.0,0.1875,0.9375 116,model.layers.16.mlp.gate_proj,tx.16.mlp.gate,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.15478515625,0.2001953125,0.24169921875,0.1999511867761612,0.0,0.203125,0.3828125,0.1999511867761612,0.0,0.1875,0.75 117,model.layers.16.mlp.up_proj,tx.16.mlp.up,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.16064453125,0.19970703125,0.23681640625,0.1999511867761612,0.0078125,0.203125,0.421875,0.1999511867761612,0.0,0.1875,0.8125 118,model.layers.16.mlp.down_proj,tx.16.mlp.down,Linear,weight,"[4096, 14336]",58720256,46977024,0.1999860405921936,"(128, 16)",32 x 896,28672,0.1999860554933548,0.15185546875,0.2001953125,0.2548828125,0.1999860554933548,0.0078125,0.1953125,0.484375,0.1999860554933548,0.0,0.1875,0.8125 119,model.layers.17.self_attn.q_proj,tx.17.attn.q,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.1533203125,0.2001953125,0.24267578125,0.199951171875,0.0,0.203125,0.4609375,0.199951171875,0.0,0.1875,0.75 120,model.layers.17.self_attn.k_proj,tx.17.attn.k,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.15966796875,0.19970703125,0.2529296875,0.199951171875,0.0,0.203125,0.59375,0.199951171875,0.0,0.1875,0.6875 121,model.layers.17.self_attn.v_proj,tx.17.attn.v,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.16015625,0.19921875,0.271484375,0.199951171875,0.0078125,0.203125,1.0,0.199951171875,0.0,0.1875,0.75 122,model.layers.17.self_attn.o_proj,tx.17.attn.o,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.0849609375,0.18310546875,0.44189453125,0.199951171875,0.0,0.1875,0.640625,0.199951171875,0.0,0.1875,0.875 123,model.layers.17.mlp.gate_proj,tx.17.mlp.gate,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.158203125,0.19970703125,0.2392578125,0.1999511867761612,0.0,0.203125,0.421875,0.1999511867761612,0.0,0.1875,0.75 124,model.layers.17.mlp.up_proj,tx.17.mlp.up,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.1611328125,0.2001953125,0.2373046875,0.1999511867761612,0.0,0.203125,0.4140625,0.1999511867761612,0.0,0.1875,0.8125 125,model.layers.17.mlp.down_proj,tx.17.mlp.down,Linear,weight,"[4096, 14336]",58720256,46977024,0.1999860405921936,"(128, 16)",32 x 896,28672,0.1999860554933548,0.146484375,0.19970703125,0.27392578125,0.1999860554933548,0.0,0.203125,0.625,0.1999860554933548,0.0,0.1875,0.75 126,model.layers.18.self_attn.q_proj,tx.18.attn.q,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.154296875,0.2001953125,0.24560546875,0.199951171875,0.0,0.203125,0.53125,0.199951171875,0.0,0.1875,0.75 127,model.layers.18.self_attn.k_proj,tx.18.attn.k,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.15673828125,0.2001953125,0.24462890625,0.199951171875,0.0,0.203125,0.65625,0.199951171875,0.0,0.1875,0.75 128,model.layers.18.self_attn.v_proj,tx.18.attn.v,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.15234375,0.19921875,0.27001953125,0.199951171875,0.0,0.203125,1.0,0.199951171875,0.0,0.1875,0.75 129,model.layers.18.self_attn.o_proj,tx.18.attn.o,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.07421875,0.1513671875,0.587890625,0.199951171875,0.0,0.1640625,0.796875,0.199951171875,0.0,0.1875,1.0 130,model.layers.18.mlp.gate_proj,tx.18.mlp.gate,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.158203125,0.2001953125,0.23974609375,0.1999511867761612,0.0,0.203125,0.4140625,0.1999511867761612,0.0,0.1875,0.8125 131,model.layers.18.mlp.up_proj,tx.18.mlp.up,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.162109375,0.19970703125,0.23828125,0.1999511867761612,0.0078125,0.203125,0.4765625,0.1999511867761612,0.0,0.1875,0.75 132,model.layers.18.mlp.down_proj,tx.18.mlp.down,Linear,weight,"[4096, 14336]",58720256,46977024,0.1999860405921936,"(128, 16)",32 x 896,28672,0.1999860554933548,0.15283203125,0.2001953125,0.255859375,0.1999860554933548,0.0,0.203125,0.5,0.1999860554933548,0.0,0.1875,0.8125 133,model.layers.19.self_attn.q_proj,tx.19.attn.q,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.15478515625,0.2001953125,0.24267578125,0.199951171875,0.0,0.203125,0.4375,0.199951171875,0.0,0.1875,0.75 134,model.layers.19.self_attn.k_proj,tx.19.attn.k,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.15380859375,0.2001953125,0.25,0.199951171875,0.0,0.203125,0.625,0.199951171875,0.0,0.1875,0.6875 135,model.layers.19.self_attn.v_proj,tx.19.attn.v,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.15478515625,0.19970703125,0.26953125,0.199951171875,0.0,0.203125,1.0,0.199951171875,0.0,0.1875,0.75 136,model.layers.19.self_attn.o_proj,tx.19.attn.o,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.05419921875,0.18798828125,0.49072265625,0.199951171875,0.0,0.1875,0.6875,0.199951171875,0.0,0.1875,1.0 137,model.layers.19.mlp.gate_proj,tx.19.mlp.gate,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.16015625,0.2001953125,0.2353515625,0.1999511867761612,0.0,0.203125,0.453125,0.1999511867761612,0.0,0.1875,0.8125 138,model.layers.19.mlp.up_proj,tx.19.mlp.up,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.162109375,0.2001953125,0.23681640625,0.1999511867761612,0.0078125,0.203125,0.4765625,0.1999511867761612,0.0,0.1875,0.8125 139,model.layers.19.mlp.down_proj,tx.19.mlp.down,Linear,weight,"[4096, 14336]",58720256,46977024,0.1999860405921936,"(128, 16)",32 x 896,28672,0.1999860554933548,0.1435546875,0.19970703125,0.25830078125,0.1999860554933548,0.0,0.203125,0.4609375,0.1999860554933548,0.0,0.1875,0.75 140,model.layers.20.self_attn.q_proj,tx.20.attn.q,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.14892578125,0.2001953125,0.24169921875,0.199951171875,0.0,0.203125,0.4375,0.199951171875,0.0,0.1875,0.75 141,model.layers.20.self_attn.k_proj,tx.20.attn.k,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.1474609375,0.2001953125,0.24755859375,0.199951171875,0.0,0.203125,0.625,0.199951171875,0.0,0.1875,0.6875 142,model.layers.20.self_attn.v_proj,tx.20.attn.v,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.15625,0.19970703125,0.28515625,0.199951171875,0.0,0.203125,1.0,0.199951171875,0.0,0.1875,0.75 143,model.layers.20.self_attn.o_proj,tx.20.attn.o,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.0791015625,0.171875,0.5244140625,0.199951171875,0.0,0.171875,0.7890625,0.199951171875,0.0,0.1875,1.0 144,model.layers.20.mlp.gate_proj,tx.20.mlp.gate,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.16259765625,0.2001953125,0.2392578125,0.1999511867761612,0.0,0.203125,0.4296875,0.1999511867761612,0.0,0.1875,0.8125 145,model.layers.20.mlp.up_proj,tx.20.mlp.up,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.15771484375,0.19970703125,0.2373046875,0.1999511867761612,0.0,0.203125,0.4921875,0.1999511867761612,0.0,0.1875,0.8125 146,model.layers.20.mlp.down_proj,tx.20.mlp.down,Linear,weight,"[4096, 14336]",58720256,46977024,0.1999860405921936,"(128, 16)",32 x 896,28672,0.1999860554933548,0.14990234375,0.2001953125,0.255859375,0.1999860554933548,0.0,0.203125,0.453125,0.1999860554933548,0.0,0.1875,0.8125 147,model.layers.21.self_attn.q_proj,tx.21.attn.q,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.15380859375,0.2001953125,0.24365234375,0.199951171875,0.0,0.203125,0.40625,0.199951171875,0.0,0.1875,0.75 148,model.layers.21.self_attn.k_proj,tx.21.attn.k,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.15185546875,0.2001953125,0.2431640625,0.199951171875,0.0,0.203125,0.625,0.199951171875,0.0,0.1875,0.75 149,model.layers.21.self_attn.v_proj,tx.21.attn.v,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.15869140625,0.19970703125,0.263671875,0.199951171875,0.0,0.203125,0.9921875,0.199951171875,0.0,0.1875,0.6875 150,model.layers.21.self_attn.o_proj,tx.21.attn.o,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.0634765625,0.169921875,0.57275390625,0.199951171875,0.0,0.1796875,0.8359375,0.199951171875,0.0,0.1875,0.9375 151,model.layers.21.mlp.gate_proj,tx.21.mlp.gate,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.15869140625,0.2001953125,0.24169921875,0.1999511867761612,0.0,0.203125,0.484375,0.1999511867761612,0.0,0.1875,0.8125 152,model.layers.21.mlp.up_proj,tx.21.mlp.up,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.162109375,0.19970703125,0.2373046875,0.1999511867761612,0.0078125,0.203125,0.4609375,0.1999511867761612,0.0,0.1875,0.8125 153,model.layers.21.mlp.down_proj,tx.21.mlp.down,Linear,weight,"[4096, 14336]",58720256,46977024,0.1999860405921936,"(128, 16)",32 x 896,28672,0.1999860554933548,0.142578125,0.19970703125,0.25390625,0.1999860554933548,0.0,0.203125,0.4296875,0.1999860554933548,0.0,0.1875,0.75 154,model.layers.22.self_attn.q_proj,tx.22.attn.q,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.15283203125,0.2001953125,0.248046875,0.199951171875,0.0,0.203125,0.40625,0.199951171875,0.0,0.1875,0.8125 155,model.layers.22.self_attn.k_proj,tx.22.attn.k,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.15380859375,0.2001953125,0.24853515625,0.199951171875,0.0,0.203125,0.6875,0.199951171875,0.0,0.1875,0.625 156,model.layers.22.self_attn.v_proj,tx.22.attn.v,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.15283203125,0.19921875,0.267578125,0.199951171875,0.0,0.203125,1.0,0.199951171875,0.0,0.1875,0.75 157,model.layers.22.self_attn.o_proj,tx.22.attn.o,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.07470703125,0.1943359375,0.41650390625,0.199951171875,0.0,0.1875,0.59375,0.199951171875,0.0,0.1875,0.875 158,model.layers.22.mlp.gate_proj,tx.22.mlp.gate,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.1572265625,0.2001953125,0.2373046875,0.1999511867761612,0.0,0.203125,0.4296875,0.1999511867761612,0.0,0.1875,0.8125 159,model.layers.22.mlp.up_proj,tx.22.mlp.up,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.1650390625,0.2001953125,0.23876953125,0.1999511867761612,0.0,0.203125,0.484375,0.1999511867761612,0.0,0.1875,0.8125 160,model.layers.22.mlp.down_proj,tx.22.mlp.down,Linear,weight,"[4096, 14336]",58720256,46977024,0.1999860405921936,"(128, 16)",32 x 896,28672,0.1999860554933548,0.14306640625,0.19970703125,0.25537109375,0.1999860554933548,0.0,0.203125,0.4375,0.1999860554933548,0.0,0.1875,0.75 161,model.layers.23.self_attn.q_proj,tx.23.attn.q,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.14892578125,0.2001953125,0.24560546875,0.199951171875,0.0,0.203125,0.40625,0.199951171875,0.0,0.1875,0.75 162,model.layers.23.self_attn.k_proj,tx.23.attn.k,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.15380859375,0.2001953125,0.244140625,0.199951171875,0.0,0.203125,0.6328125,0.199951171875,0.0,0.1875,0.75 163,model.layers.23.self_attn.v_proj,tx.23.attn.v,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.15966796875,0.2001953125,0.26953125,0.199951171875,0.0,0.203125,1.0,0.199951171875,0.0,0.1875,0.75 164,model.layers.23.self_attn.o_proj,tx.23.attn.o,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.06884765625,0.19287109375,0.3935546875,0.199951171875,0.0,0.1875,0.5546875,0.199951171875,0.0,0.1875,0.875 165,model.layers.23.mlp.gate_proj,tx.23.mlp.gate,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.16015625,0.2001953125,0.2392578125,0.1999511867761612,0.0,0.203125,0.5,0.1999511867761612,0.0,0.1875,0.8125 166,model.layers.23.mlp.up_proj,tx.23.mlp.up,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.162109375,0.2001953125,0.24072265625,0.1999511867761612,0.0,0.203125,0.5,0.1999511867761612,0.0,0.1875,0.8125 167,model.layers.23.mlp.down_proj,tx.23.mlp.down,Linear,weight,"[4096, 14336]",58720256,46977024,0.1999860405921936,"(128, 16)",32 x 896,28672,0.1999860554933548,0.13720703125,0.2001953125,0.255859375,0.1999860554933548,0.0,0.203125,0.4453125,0.1999860554933548,0.0,0.1875,0.75 168,model.layers.24.self_attn.q_proj,tx.24.attn.q,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.15234375,0.19970703125,0.244140625,0.199951171875,0.0,0.203125,0.4140625,0.199951171875,0.0,0.1875,0.75 169,model.layers.24.self_attn.k_proj,tx.24.attn.k,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.15380859375,0.2001953125,0.2470703125,0.199951171875,0.0,0.203125,0.65625,0.199951171875,0.0,0.1875,0.6875 170,model.layers.24.self_attn.v_proj,tx.24.attn.v,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.15380859375,0.19970703125,0.27197265625,0.199951171875,0.0,0.203125,1.0,0.199951171875,0.0,0.1875,0.6875 171,model.layers.24.self_attn.o_proj,tx.24.attn.o,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.06396484375,0.17626953125,0.43017578125,0.199951171875,0.0,0.1796875,0.609375,0.199951171875,0.0,0.1875,0.9375 172,model.layers.24.mlp.gate_proj,tx.24.mlp.gate,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.1591796875,0.2001953125,0.240234375,0.1999511867761612,0.0,0.203125,0.4453125,0.1999511867761612,0.0,0.1875,0.75 173,model.layers.24.mlp.up_proj,tx.24.mlp.up,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.15966796875,0.2001953125,0.2431640625,0.1999511867761612,0.0,0.203125,0.4765625,0.1999511867761612,0.0,0.1875,0.8125 174,model.layers.24.mlp.down_proj,tx.24.mlp.down,Linear,weight,"[4096, 14336]",58720256,46977024,0.1999860405921936,"(128, 16)",32 x 896,28672,0.1999860554933548,0.1455078125,0.2001953125,0.25244140625,0.1999860554933548,0.0,0.203125,0.4140625,0.1999860554933548,0.0,0.1875,0.8125 175,model.layers.25.self_attn.q_proj,tx.25.attn.q,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.14990234375,0.2001953125,0.24755859375,0.199951171875,0.0,0.203125,0.390625,0.199951171875,0.0,0.1875,0.75 176,model.layers.25.self_attn.k_proj,tx.25.attn.k,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.14990234375,0.2001953125,0.248046875,0.199951171875,0.0,0.203125,0.578125,0.199951171875,0.0,0.1875,0.6875 177,model.layers.25.self_attn.v_proj,tx.25.attn.v,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.15087890625,0.19970703125,0.27392578125,0.199951171875,0.0,0.203125,1.0,0.199951171875,0.0,0.1875,0.6875 178,model.layers.25.self_attn.o_proj,tx.25.attn.o,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.06201171875,0.162109375,0.609375,0.199951171875,0.0,0.171875,0.8046875,0.199951171875,0.0,0.1875,1.0 179,model.layers.25.mlp.gate_proj,tx.25.mlp.gate,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.15576171875,0.19970703125,0.24365234375,0.1999511867761612,0.0,0.203125,0.4453125,0.1999511867761612,0.0,0.1875,0.8125 180,model.layers.25.mlp.up_proj,tx.25.mlp.up,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.15283203125,0.19970703125,0.2431640625,0.1999511867761612,0.0,0.203125,0.4921875,0.1999511867761612,0.0,0.1875,0.8125 181,model.layers.25.mlp.down_proj,tx.25.mlp.down,Linear,weight,"[4096, 14336]",58720256,46977024,0.1999860405921936,"(128, 16)",32 x 896,28672,0.1999860554933548,0.1435546875,0.2001953125,0.25732421875,0.1999860554933548,0.0,0.203125,0.4296875,0.1999860554933548,0.0,0.1875,0.8125 182,model.layers.26.self_attn.q_proj,tx.26.attn.q,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.150390625,0.2001953125,0.248046875,0.199951171875,0.0,0.203125,0.4140625,0.199951171875,0.0,0.1875,0.75 183,model.layers.26.self_attn.k_proj,tx.26.attn.k,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.15234375,0.2001953125,0.25146484375,0.199951171875,0.0,0.203125,0.6640625,0.199951171875,0.0,0.1875,0.6875 184,model.layers.26.self_attn.v_proj,tx.26.attn.v,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.1591796875,0.19970703125,0.275390625,0.199951171875,0.0,0.203125,1.0,0.199951171875,0.0,0.1875,0.6875 185,model.layers.26.self_attn.o_proj,tx.26.attn.o,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.068359375,0.169921875,0.4501953125,0.199951171875,0.0,0.171875,0.6015625,0.199951171875,0.0,0.1875,0.9375 186,model.layers.26.mlp.gate_proj,tx.26.mlp.gate,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.15966796875,0.2001953125,0.2392578125,0.1999511867761612,0.0,0.203125,0.484375,0.1999511867761612,0.0,0.1875,0.8125 187,model.layers.26.mlp.up_proj,tx.26.mlp.up,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.1533203125,0.19970703125,0.2421875,0.1999511867761612,0.0,0.203125,0.4921875,0.1999511867761612,0.0,0.1875,0.8125 188,model.layers.26.mlp.down_proj,tx.26.mlp.down,Linear,weight,"[4096, 14336]",58720256,46977024,0.1999860405921936,"(128, 16)",32 x 896,28672,0.1999860554933548,0.13818359375,0.2001953125,0.251953125,0.1999860554933548,0.0,0.203125,0.4375,0.1999860554933548,0.0,0.1875,0.8125 189,model.layers.27.self_attn.q_proj,tx.27.attn.q,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.15087890625,0.2001953125,0.27099609375,0.199951171875,0.0,0.203125,1.0,0.199951171875,0.0,0.1875,0.75 190,model.layers.27.self_attn.k_proj,tx.27.attn.k,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.14697265625,0.19970703125,0.271484375,0.199951171875,0.0,0.203125,1.0,0.199951171875,0.0,0.1875,0.75 191,model.layers.27.self_attn.v_proj,tx.27.attn.v,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.15673828125,0.19970703125,0.26953125,0.199951171875,0.0,0.203125,1.0,0.199951171875,0.0,0.1875,0.6875 192,model.layers.27.self_attn.o_proj,tx.27.attn.o,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.06787109375,0.18115234375,0.42138671875,0.199951171875,0.0,0.1796875,0.6328125,0.199951171875,0.0,0.1875,0.875 193,model.layers.27.mlp.gate_proj,tx.27.mlp.gate,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.162109375,0.2001953125,0.24072265625,0.1999511867761612,0.0,0.203125,0.4609375,0.1999511867761612,0.0,0.1875,0.75 194,model.layers.27.mlp.up_proj,tx.27.mlp.up,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.15673828125,0.2001953125,0.236328125,0.1999511867761612,0.0,0.203125,0.5234375,0.1999511867761612,0.0,0.1875,0.8125 195,model.layers.27.mlp.down_proj,tx.27.mlp.down,Linear,weight,"[4096, 14336]",58720256,46977024,0.1999860405921936,"(128, 16)",32 x 896,28672,0.1999860554933548,0.14013671875,0.2001953125,0.2509765625,0.1999860554933548,0.0,0.203125,0.4296875,0.1999860554933548,0.0,0.1875,0.75 196,model.layers.28.self_attn.q_proj,tx.28.attn.q,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.14794921875,0.2001953125,0.24853515625,0.199951171875,0.0,0.203125,0.3828125,0.199951171875,0.0,0.1875,0.75 197,model.layers.28.self_attn.k_proj,tx.28.attn.k,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.15234375,0.2001953125,0.25,0.199951171875,0.0,0.203125,0.6171875,0.199951171875,0.0,0.1875,0.75 198,model.layers.28.self_attn.v_proj,tx.28.attn.v,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.15869140625,0.19921875,0.2744140625,0.199951171875,0.0,0.203125,1.0,0.199951171875,0.0,0.1875,0.75 199,model.layers.28.self_attn.o_proj,tx.28.attn.o,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.05908203125,0.19091796875,0.46923828125,0.199951171875,0.0,0.1875,0.6015625,0.199951171875,0.0,0.1875,0.875 200,model.layers.28.mlp.gate_proj,tx.28.mlp.gate,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.14990234375,0.2001953125,0.2392578125,0.1999511867761612,0.0,0.203125,0.453125,0.1999511867761612,0.0,0.1875,0.75 201,model.layers.28.mlp.up_proj,tx.28.mlp.up,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.1572265625,0.19970703125,0.23876953125,0.1999511867761612,0.0,0.203125,0.4375,0.1999511867761612,0.0,0.1875,0.8125 202,model.layers.28.mlp.down_proj,tx.28.mlp.down,Linear,weight,"[4096, 14336]",58720256,46977024,0.1999860405921936,"(128, 16)",32 x 896,28672,0.1999860554933548,0.1357421875,0.2001953125,0.25927734375,0.1999860554933548,0.0,0.2109375,0.4140625,0.1999860554933548,0.0,0.1875,0.75 203,model.layers.29.self_attn.q_proj,tx.29.attn.q,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.15234375,0.2001953125,0.291015625,0.199951171875,0.0,0.203125,1.0,0.199951171875,0.0,0.1875,0.75 204,model.layers.29.self_attn.k_proj,tx.29.attn.k,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.14599609375,0.20068359375,0.26904296875,0.199951171875,0.0,0.203125,1.0,0.199951171875,0.0,0.1875,0.6875 205,model.layers.29.self_attn.v_proj,tx.29.attn.v,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.15966796875,0.19921875,0.27099609375,0.199951171875,0.0078125,0.203125,1.0,0.199951171875,0.0,0.1875,0.8125 206,model.layers.29.self_attn.o_proj,tx.29.attn.o,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.04248046875,0.21533203125,0.38720703125,0.199951171875,0.0,0.1953125,0.546875,0.199951171875,0.0,0.1875,0.9375 207,model.layers.29.mlp.gate_proj,tx.29.mlp.gate,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.1552734375,0.19970703125,0.23876953125,0.1999511867761612,0.0,0.203125,0.484375,0.1999511867761612,0.0,0.1875,0.8125 208,model.layers.29.mlp.up_proj,tx.29.mlp.up,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.158203125,0.2001953125,0.24072265625,0.1999511867761612,0.0,0.203125,0.4453125,0.1999511867761612,0.0,0.1875,0.75 209,model.layers.29.mlp.down_proj,tx.29.mlp.down,Linear,weight,"[4096, 14336]",58720256,46977024,0.1999860405921936,"(128, 16)",32 x 896,28672,0.1999860554933548,0.14453125,0.2001953125,0.2587890625,0.1999860554933548,0.0,0.2109375,0.421875,0.1999860554933548,0.0,0.1875,0.8125 210,model.layers.30.self_attn.q_proj,tx.30.attn.q,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.14404296875,0.2001953125,0.24462890625,0.199951171875,0.0,0.203125,0.390625,0.199951171875,0.0,0.1875,0.75 211,model.layers.30.self_attn.k_proj,tx.30.attn.k,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.14453125,0.2001953125,0.25,0.199951171875,0.0,0.203125,0.59375,0.199951171875,0.0,0.1875,0.75 212,model.layers.30.self_attn.v_proj,tx.30.attn.v,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.1513671875,0.19921875,0.28173828125,0.199951171875,0.0,0.203125,1.0,0.199951171875,0.0,0.1875,0.75 213,model.layers.30.self_attn.o_proj,tx.30.attn.o,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.05322265625,0.17919921875,0.6240234375,0.199951171875,0.0,0.1796875,0.7421875,0.199951171875,0.0,0.1875,1.0 214,model.layers.30.mlp.gate_proj,tx.30.mlp.gate,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.162109375,0.2001953125,0.24609375,0.1999511867761612,0.0,0.203125,0.5703125,0.1999511867761612,0.0,0.1875,0.75 215,model.layers.30.mlp.up_proj,tx.30.mlp.up,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.1552734375,0.2001953125,0.2412109375,0.1999511867761612,0.0,0.203125,0.515625,0.1999511867761612,0.0,0.1875,0.8125 216,model.layers.30.mlp.down_proj,tx.30.mlp.down,Linear,weight,"[4096, 14336]",58720256,46977024,0.1999860405921936,"(128, 16)",32 x 896,28672,0.1999860554933548,0.13427734375,0.2001953125,0.25927734375,0.1999860554933548,0.0,0.2109375,0.46875,0.1999860554933548,0.0,0.1875,0.75 217,model.layers.31.self_attn.q_proj,tx.31.attn.q,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.146484375,0.19970703125,0.24951171875,0.199951171875,0.0,0.203125,0.625,0.199951171875,0.0,0.1875,0.75 218,model.layers.31.self_attn.k_proj,tx.31.attn.k,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.14404296875,0.19970703125,0.23974609375,0.199951171875,0.0,0.203125,0.6484375,0.199951171875,0.0,0.1875,0.75 219,model.layers.31.self_attn.v_proj,tx.31.attn.v,Linear,weight,"[1024, 4096]",4194304,3355648,0.199951171875,"(128, 16)",8 x 256,2048,0.199951171875,0.1357421875,0.19970703125,0.26953125,0.199951171875,0.0,0.203125,0.9921875,0.199951171875,0.0,0.1875,0.6875 220,model.layers.31.self_attn.o_proj,tx.31.attn.o,Linear,weight,"[4096, 4096]",16777216,13422592,0.199951171875,"(128, 16)",32 x 256,8192,0.199951171875,0.02783203125,0.1728515625,0.435546875,0.199951171875,0.0,0.1796875,0.65625,0.199951171875,0.0,0.1875,0.9375 221,model.layers.31.mlp.gate_proj,tx.31.mlp.gate,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.162109375,0.2001953125,0.2470703125,0.1999511867761612,0.0078125,0.203125,0.5546875,0.1999511867761612,0.0,0.1875,0.8125 222,model.layers.31.mlp.up_proj,tx.31.mlp.up,Linear,weight,"[14336, 4096]",58720256,46979072,0.19995111227035522,"(128, 16)",112 x 256,28672,0.1999511867761612,0.1591796875,0.2001953125,0.24072265625,0.1999511867761612,0.0078125,0.203125,0.53125,0.1999511867761612,0.0,0.1875,0.8125 223,model.layers.31.mlp.down_proj,tx.31.mlp.down,Linear,weight,"[4096, 14336]",58720256,46977024,0.1999860405921936,"(128, 16)",32 x 896,28672,0.1999860554933548,0.12353515625,0.2001953125,0.283203125,0.1999860554933548,0.0,0.21875,0.5703125,0.1999860554933548,0.0,0.1875,0.8125 224,lm_head,lm_head,Linear,weight,"[128256, 4096]",525336576,525336576,0.0,"(128, 16)",1002 x 256,256512,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0