program(1.3) [buildInfo = dict({{"coremlc-component-MIL", "3400.43.1"}, {"coremlc-version", "3400.58.2"}, {"coremltools-component-torch", "2.4.1"}, {"coremltools-source-dialect", "TorchScript"}, {"coremltools-version", "8.0"}})] { func main(tensor logmel_data) { string var_68_pad_type_0 = const()[name = string("op_68_pad_type_0"), val = string("custom")]; tensor var_68_pad_0 = const()[name = string("op_68_pad_0"), val = tensor([1, 1])]; tensor var_68_strides_0 = const()[name = string("op_68_strides_0"), val = tensor([1])]; tensor var_68_dilations_0 = const()[name = string("op_68_dilations_0"), val = tensor([1])]; int32 var_68_groups_0 = const()[name = string("op_68_groups_0"), val = int32(1)]; tensor weight_3_to_fp16 = const()[name = string("weight_3_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(64)))]; tensor bias_3_to_fp16 = const()[name = string("bias_3_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(491648)))]; tensor var_68_cast_fp16 = conv(bias = bias_3_to_fp16, dilations = var_68_dilations_0, groups = var_68_groups_0, pad = var_68_pad_0, pad_type = var_68_pad_type_0, strides = var_68_strides_0, weight = weight_3_to_fp16, x = logmel_data)[name = string("op_68_cast_fp16")]; string input_1_mode_0 = const()[name = string("input_1_mode_0"), val = string("EXACT")]; tensor input_1_cast_fp16 = gelu(mode = input_1_mode_0, x = var_68_cast_fp16)[name = string("input_1_cast_fp16")]; string var_86_pad_type_0 = const()[name = string("op_86_pad_type_0"), val = string("custom")]; tensor var_86_pad_0 = const()[name = string("op_86_pad_0"), val = tensor([1, 1])]; tensor var_86_strides_0 = const()[name = string("op_86_strides_0"), val = tensor([2])]; tensor var_86_dilations_0 = const()[name = string("op_86_dilations_0"), val = tensor([1])]; int32 var_86_groups_0 = const()[name = string("op_86_groups_0"), val = int32(1)]; tensor weight_7_to_fp16 = const()[name = string("weight_7_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(493760)))]; tensor bias_7_to_fp16 = const()[name = string("bias_7_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(6785280)))]; tensor var_86_cast_fp16 = conv(bias = bias_7_to_fp16, dilations = var_86_dilations_0, groups = var_86_groups_0, pad = var_86_pad_0, pad_type = var_86_pad_type_0, strides = var_86_strides_0, weight = weight_7_to_fp16, x = input_1_cast_fp16)[name = string("op_86_cast_fp16")]; string x_3_mode_0 = const()[name = string("x_3_mode_0"), val = string("EXACT")]; tensor x_3_cast_fp16 = gelu(mode = x_3_mode_0, x = var_86_cast_fp16)[name = string("x_3_cast_fp16")]; tensor var_92 = const()[name = string("op_92"), val = tensor([0, 2, 1])]; tensor positional_embedding_to_fp16 = const()[name = string("positional_embedding_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(6787392)))]; tensor x_5_cast_fp16 = transpose(perm = var_92, x = x_3_cast_fp16)[name = string("transpose_240")]; tensor var_95_cast_fp16 = add(x = x_5_cast_fp16, y = positional_embedding_to_fp16)[name = string("op_95_cast_fp16")]; int32 var_108 = const()[name = string("op_108"), val = int32(-1)]; tensor var_124_axes_0 = const()[name = string("op_124_axes_0"), val = tensor([-1])]; tensor blocks_0_attn_ln_weight_to_fp16 = const()[name = string("blocks_0_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(9859456)))]; tensor blocks_0_attn_ln_bias_to_fp16 = const()[name = string("blocks_0_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(9861568)))]; fp16 var_114_to_fp16 = const()[name = string("op_114_to_fp16"), val = fp16(0x1.5p-17)]; tensor var_124_cast_fp16 = layer_norm(axes = var_124_axes_0, beta = blocks_0_attn_ln_bias_to_fp16, epsilon = var_114_to_fp16, gamma = blocks_0_attn_ln_weight_to_fp16, x = var_95_cast_fp16)[name = string("op_124_cast_fp16")]; tensor var_135_to_fp16 = const()[name = string("op_135_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(9863680)))]; tensor var_136_to_fp16 = const()[name = string("op_136_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(11960896)))]; tensor linear_0_cast_fp16 = linear(bias = var_136_to_fp16, weight = var_135_to_fp16, x = var_124_cast_fp16)[name = string("linear_0_cast_fp16")]; tensor var_139_to_fp16 = const()[name = string("op_139_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(11963008)))]; tensor linear_1_bias_0_to_fp16 = const()[name = string("linear_1_bias_0_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(14060224)))]; tensor linear_1_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_139_to_fp16, x = var_124_cast_fp16)[name = string("linear_1_cast_fp16")]; tensor var_143_to_fp16 = const()[name = string("op_143_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(14062336)))]; tensor var_144_to_fp16 = const()[name = string("op_144_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(16159552)))]; tensor linear_2_cast_fp16 = linear(bias = var_144_to_fp16, weight = var_143_to_fp16, x = var_124_cast_fp16)[name = string("linear_2_cast_fp16")]; tensor var_152 = const()[name = string("op_152"), val = tensor([1, 1500, 16, -1])]; tensor var_153_cast_fp16 = reshape(shape = var_152, x = linear_0_cast_fp16)[name = string("op_153_cast_fp16")]; tensor const_168_to_fp16 = const()[name = string("const_168_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_3_cast_fp16 = mul(x = var_153_cast_fp16, y = const_168_to_fp16)[name = string("q_3_cast_fp16")]; tensor var_159 = const()[name = string("op_159"), val = tensor([1, 1500, 16, -1])]; tensor var_160_cast_fp16 = reshape(shape = var_159, x = linear_1_cast_fp16)[name = string("op_160_cast_fp16")]; tensor const_169_to_fp16 = const()[name = string("const_169_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_3_cast_fp16 = mul(x = var_160_cast_fp16, y = const_169_to_fp16)[name = string("k_3_cast_fp16")]; tensor var_166 = const()[name = string("op_166"), val = tensor([1, 1500, 16, -1])]; tensor var_167_cast_fp16 = reshape(shape = var_166, x = linear_2_cast_fp16)[name = string("op_167_cast_fp16")]; tensor var_168 = const()[name = string("op_168"), val = tensor([0, 2, 1, 3])]; bool qk_1_transpose_x_0 = const()[name = string("qk_1_transpose_x_0"), val = bool(false)]; bool qk_1_transpose_y_0 = const()[name = string("qk_1_transpose_y_0"), val = bool(false)]; tensor transpose_96_perm_0 = const()[name = string("transpose_96_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_97_perm_0 = const()[name = string("transpose_97_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_97 = transpose(perm = transpose_97_perm_0, x = k_3_cast_fp16)[name = string("transpose_237")]; tensor transpose_96 = transpose(perm = transpose_96_perm_0, x = q_3_cast_fp16)[name = string("transpose_238")]; tensor qk_1_cast_fp16 = matmul(transpose_x = qk_1_transpose_x_0, transpose_y = qk_1_transpose_y_0, x = transpose_96, y = transpose_97)[name = string("qk_1_cast_fp16")]; tensor var_172_cast_fp16 = softmax(axis = var_108, x = qk_1_cast_fp16)[name = string("op_172_cast_fp16")]; bool var_174_transpose_x_0 = const()[name = string("op_174_transpose_x_0"), val = bool(false)]; bool var_174_transpose_y_0 = const()[name = string("op_174_transpose_y_0"), val = bool(false)]; tensor v_3_cast_fp16 = transpose(perm = var_168, x = var_167_cast_fp16)[name = string("transpose_239")]; tensor var_174_cast_fp16 = matmul(transpose_x = var_174_transpose_x_0, transpose_y = var_174_transpose_y_0, x = var_172_cast_fp16, y = v_3_cast_fp16)[name = string("op_174_cast_fp16")]; tensor var_175 = const()[name = string("op_175"), val = tensor([0, 2, 1, 3])]; tensor concat_0 = const()[name = string("concat_0"), val = tensor([1, 1500, 1024])]; tensor var_176_cast_fp16 = transpose(perm = var_175, x = var_174_cast_fp16)[name = string("transpose_236")]; tensor x_11_cast_fp16 = reshape(shape = concat_0, x = var_176_cast_fp16)[name = string("x_11_cast_fp16")]; tensor var_180_to_fp16 = const()[name = string("op_180_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(16161664)))]; tensor var_181_to_fp16 = const()[name = string("op_181_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(18258880)))]; tensor linear_3_cast_fp16 = linear(bias = var_181_to_fp16, weight = var_180_to_fp16, x = x_11_cast_fp16)[name = string("linear_3_cast_fp16")]; tensor x_13_cast_fp16 = add(x = var_95_cast_fp16, y = linear_3_cast_fp16)[name = string("x_13_cast_fp16")]; tensor var_188_axes_0 = const()[name = string("op_188_axes_0"), val = tensor([-1])]; tensor blocks_0_mlp_ln_weight_to_fp16 = const()[name = string("blocks_0_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(18260992)))]; tensor blocks_0_mlp_ln_bias_to_fp16 = const()[name = string("blocks_0_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(18263104)))]; tensor var_188_cast_fp16 = layer_norm(axes = var_188_axes_0, beta = blocks_0_mlp_ln_bias_to_fp16, epsilon = var_114_to_fp16, gamma = blocks_0_mlp_ln_weight_to_fp16, x = x_13_cast_fp16)[name = string("op_188_cast_fp16")]; tensor var_197_to_fp16 = const()[name = string("op_197_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(18265216)))]; tensor var_198_to_fp16 = const()[name = string("op_198_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(26653888)))]; tensor linear_4_cast_fp16 = linear(bias = var_198_to_fp16, weight = var_197_to_fp16, x = var_188_cast_fp16)[name = string("linear_4_cast_fp16")]; string x_17_mode_0 = const()[name = string("x_17_mode_0"), val = string("EXACT")]; tensor x_17_cast_fp16 = gelu(mode = x_17_mode_0, x = linear_4_cast_fp16)[name = string("x_17_cast_fp16")]; tensor var_203_to_fp16 = const()[name = string("op_203_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(26662144)))]; tensor var_204_to_fp16 = const()[name = string("op_204_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(35050816)))]; tensor linear_5_cast_fp16 = linear(bias = var_204_to_fp16, weight = var_203_to_fp16, x = x_17_cast_fp16)[name = string("linear_5_cast_fp16")]; tensor x_19_cast_fp16 = add(x = x_13_cast_fp16, y = linear_5_cast_fp16)[name = string("x_19_cast_fp16")]; int32 var_214 = const()[name = string("op_214"), val = int32(-1)]; tensor var_230_axes_0 = const()[name = string("op_230_axes_0"), val = tensor([-1])]; tensor blocks_1_attn_ln_weight_to_fp16 = const()[name = string("blocks_1_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(35052928)))]; tensor blocks_1_attn_ln_bias_to_fp16 = const()[name = string("blocks_1_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(35055040)))]; fp16 var_220_to_fp16 = const()[name = string("op_220_to_fp16"), val = fp16(0x1.5p-17)]; tensor var_230_cast_fp16 = layer_norm(axes = var_230_axes_0, beta = blocks_1_attn_ln_bias_to_fp16, epsilon = var_220_to_fp16, gamma = blocks_1_attn_ln_weight_to_fp16, x = x_19_cast_fp16)[name = string("op_230_cast_fp16")]; tensor var_241_to_fp16 = const()[name = string("op_241_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(35057152)))]; tensor var_242_to_fp16 = const()[name = string("op_242_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(37154368)))]; tensor linear_6_cast_fp16 = linear(bias = var_242_to_fp16, weight = var_241_to_fp16, x = var_230_cast_fp16)[name = string("linear_6_cast_fp16")]; tensor var_245_to_fp16 = const()[name = string("op_245_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(37156480)))]; tensor linear_7_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_245_to_fp16, x = var_230_cast_fp16)[name = string("linear_7_cast_fp16")]; tensor var_249_to_fp16 = const()[name = string("op_249_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(39253696)))]; tensor var_250_to_fp16 = const()[name = string("op_250_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(41350912)))]; tensor linear_8_cast_fp16 = linear(bias = var_250_to_fp16, weight = var_249_to_fp16, x = var_230_cast_fp16)[name = string("linear_8_cast_fp16")]; tensor var_258 = const()[name = string("op_258"), val = tensor([1, 1500, 16, -1])]; tensor var_259_cast_fp16 = reshape(shape = var_258, x = linear_6_cast_fp16)[name = string("op_259_cast_fp16")]; tensor const_170_to_fp16 = const()[name = string("const_170_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_7_cast_fp16 = mul(x = var_259_cast_fp16, y = const_170_to_fp16)[name = string("q_7_cast_fp16")]; tensor var_265 = const()[name = string("op_265"), val = tensor([1, 1500, 16, -1])]; tensor var_266_cast_fp16 = reshape(shape = var_265, x = linear_7_cast_fp16)[name = string("op_266_cast_fp16")]; tensor const_171_to_fp16 = const()[name = string("const_171_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_7_cast_fp16 = mul(x = var_266_cast_fp16, y = const_171_to_fp16)[name = string("k_7_cast_fp16")]; tensor var_272 = const()[name = string("op_272"), val = tensor([1, 1500, 16, -1])]; tensor var_273_cast_fp16 = reshape(shape = var_272, x = linear_8_cast_fp16)[name = string("op_273_cast_fp16")]; tensor var_274 = const()[name = string("op_274"), val = tensor([0, 2, 1, 3])]; bool qk_3_transpose_x_0 = const()[name = string("qk_3_transpose_x_0"), val = bool(false)]; bool qk_3_transpose_y_0 = const()[name = string("qk_3_transpose_y_0"), val = bool(false)]; tensor transpose_98_perm_0 = const()[name = string("transpose_98_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_99_perm_0 = const()[name = string("transpose_99_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_99 = transpose(perm = transpose_99_perm_0, x = k_7_cast_fp16)[name = string("transpose_233")]; tensor transpose_98 = transpose(perm = transpose_98_perm_0, x = q_7_cast_fp16)[name = string("transpose_234")]; tensor qk_3_cast_fp16 = matmul(transpose_x = qk_3_transpose_x_0, transpose_y = qk_3_transpose_y_0, x = transpose_98, y = transpose_99)[name = string("qk_3_cast_fp16")]; tensor var_278_cast_fp16 = softmax(axis = var_214, x = qk_3_cast_fp16)[name = string("op_278_cast_fp16")]; bool var_280_transpose_x_0 = const()[name = string("op_280_transpose_x_0"), val = bool(false)]; bool var_280_transpose_y_0 = const()[name = string("op_280_transpose_y_0"), val = bool(false)]; tensor v_7_cast_fp16 = transpose(perm = var_274, x = var_273_cast_fp16)[name = string("transpose_235")]; tensor var_280_cast_fp16 = matmul(transpose_x = var_280_transpose_x_0, transpose_y = var_280_transpose_y_0, x = var_278_cast_fp16, y = v_7_cast_fp16)[name = string("op_280_cast_fp16")]; tensor var_281 = const()[name = string("op_281"), val = tensor([0, 2, 1, 3])]; tensor concat_1 = const()[name = string("concat_1"), val = tensor([1, 1500, 1024])]; tensor var_282_cast_fp16 = transpose(perm = var_281, x = var_280_cast_fp16)[name = string("transpose_232")]; tensor x_23_cast_fp16 = reshape(shape = concat_1, x = var_282_cast_fp16)[name = string("x_23_cast_fp16")]; tensor var_286_to_fp16 = const()[name = string("op_286_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(41353024)))]; tensor var_287_to_fp16 = const()[name = string("op_287_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(43450240)))]; tensor linear_9_cast_fp16 = linear(bias = var_287_to_fp16, weight = var_286_to_fp16, x = x_23_cast_fp16)[name = string("linear_9_cast_fp16")]; tensor x_25_cast_fp16 = add(x = x_19_cast_fp16, y = linear_9_cast_fp16)[name = string("x_25_cast_fp16")]; tensor var_294_axes_0 = const()[name = string("op_294_axes_0"), val = tensor([-1])]; tensor blocks_1_mlp_ln_weight_to_fp16 = const()[name = string("blocks_1_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(43452352)))]; tensor blocks_1_mlp_ln_bias_to_fp16 = const()[name = string("blocks_1_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(43454464)))]; tensor var_294_cast_fp16 = layer_norm(axes = var_294_axes_0, beta = blocks_1_mlp_ln_bias_to_fp16, epsilon = var_220_to_fp16, gamma = blocks_1_mlp_ln_weight_to_fp16, x = x_25_cast_fp16)[name = string("op_294_cast_fp16")]; tensor var_303_to_fp16 = const()[name = string("op_303_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(43456576)))]; tensor var_304_to_fp16 = const()[name = string("op_304_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(51845248)))]; tensor linear_10_cast_fp16 = linear(bias = var_304_to_fp16, weight = var_303_to_fp16, x = var_294_cast_fp16)[name = string("linear_10_cast_fp16")]; string x_29_mode_0 = const()[name = string("x_29_mode_0"), val = string("EXACT")]; tensor x_29_cast_fp16 = gelu(mode = x_29_mode_0, x = linear_10_cast_fp16)[name = string("x_29_cast_fp16")]; tensor var_309_to_fp16 = const()[name = string("op_309_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(51853504)))]; tensor var_310_to_fp16 = const()[name = string("op_310_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(60242176)))]; tensor linear_11_cast_fp16 = linear(bias = var_310_to_fp16, weight = var_309_to_fp16, x = x_29_cast_fp16)[name = string("linear_11_cast_fp16")]; tensor x_31_cast_fp16 = add(x = x_25_cast_fp16, y = linear_11_cast_fp16)[name = string("x_31_cast_fp16")]; int32 var_320 = const()[name = string("op_320"), val = int32(-1)]; tensor var_336_axes_0 = const()[name = string("op_336_axes_0"), val = tensor([-1])]; tensor blocks_2_attn_ln_weight_to_fp16 = const()[name = string("blocks_2_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(60244288)))]; tensor blocks_2_attn_ln_bias_to_fp16 = const()[name = string("blocks_2_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(60246400)))]; fp16 var_326_to_fp16 = const()[name = string("op_326_to_fp16"), val = fp16(0x1.5p-17)]; tensor var_336_cast_fp16 = layer_norm(axes = var_336_axes_0, beta = blocks_2_attn_ln_bias_to_fp16, epsilon = var_326_to_fp16, gamma = blocks_2_attn_ln_weight_to_fp16, x = x_31_cast_fp16)[name = string("op_336_cast_fp16")]; tensor var_347_to_fp16 = const()[name = string("op_347_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(60248512)))]; tensor var_348_to_fp16 = const()[name = string("op_348_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(62345728)))]; tensor linear_12_cast_fp16 = linear(bias = var_348_to_fp16, weight = var_347_to_fp16, x = var_336_cast_fp16)[name = string("linear_12_cast_fp16")]; tensor var_351_to_fp16 = const()[name = string("op_351_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(62347840)))]; tensor linear_13_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_351_to_fp16, x = var_336_cast_fp16)[name = string("linear_13_cast_fp16")]; tensor var_355_to_fp16 = const()[name = string("op_355_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(64445056)))]; tensor var_356_to_fp16 = const()[name = string("op_356_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(66542272)))]; tensor linear_14_cast_fp16 = linear(bias = var_356_to_fp16, weight = var_355_to_fp16, x = var_336_cast_fp16)[name = string("linear_14_cast_fp16")]; tensor var_364 = const()[name = string("op_364"), val = tensor([1, 1500, 16, -1])]; tensor var_365_cast_fp16 = reshape(shape = var_364, x = linear_12_cast_fp16)[name = string("op_365_cast_fp16")]; tensor const_172_to_fp16 = const()[name = string("const_172_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_11_cast_fp16 = mul(x = var_365_cast_fp16, y = const_172_to_fp16)[name = string("q_11_cast_fp16")]; tensor var_371 = const()[name = string("op_371"), val = tensor([1, 1500, 16, -1])]; tensor var_372_cast_fp16 = reshape(shape = var_371, x = linear_13_cast_fp16)[name = string("op_372_cast_fp16")]; tensor const_173_to_fp16 = const()[name = string("const_173_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_11_cast_fp16 = mul(x = var_372_cast_fp16, y = const_173_to_fp16)[name = string("k_11_cast_fp16")]; tensor var_378 = const()[name = string("op_378"), val = tensor([1, 1500, 16, -1])]; tensor var_379_cast_fp16 = reshape(shape = var_378, x = linear_14_cast_fp16)[name = string("op_379_cast_fp16")]; tensor var_380 = const()[name = string("op_380"), val = tensor([0, 2, 1, 3])]; bool qk_5_transpose_x_0 = const()[name = string("qk_5_transpose_x_0"), val = bool(false)]; bool qk_5_transpose_y_0 = const()[name = string("qk_5_transpose_y_0"), val = bool(false)]; tensor transpose_100_perm_0 = const()[name = string("transpose_100_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_101_perm_0 = const()[name = string("transpose_101_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_101 = transpose(perm = transpose_101_perm_0, x = k_11_cast_fp16)[name = string("transpose_229")]; tensor transpose_100 = transpose(perm = transpose_100_perm_0, x = q_11_cast_fp16)[name = string("transpose_230")]; tensor qk_5_cast_fp16 = matmul(transpose_x = qk_5_transpose_x_0, transpose_y = qk_5_transpose_y_0, x = transpose_100, y = transpose_101)[name = string("qk_5_cast_fp16")]; tensor var_384_cast_fp16 = softmax(axis = var_320, x = qk_5_cast_fp16)[name = string("op_384_cast_fp16")]; bool var_386_transpose_x_0 = const()[name = string("op_386_transpose_x_0"), val = bool(false)]; bool var_386_transpose_y_0 = const()[name = string("op_386_transpose_y_0"), val = bool(false)]; tensor v_11_cast_fp16 = transpose(perm = var_380, x = var_379_cast_fp16)[name = string("transpose_231")]; tensor var_386_cast_fp16 = matmul(transpose_x = var_386_transpose_x_0, transpose_y = var_386_transpose_y_0, x = var_384_cast_fp16, y = v_11_cast_fp16)[name = string("op_386_cast_fp16")]; tensor var_387 = const()[name = string("op_387"), val = tensor([0, 2, 1, 3])]; tensor concat_2 = const()[name = string("concat_2"), val = tensor([1, 1500, 1024])]; tensor var_388_cast_fp16 = transpose(perm = var_387, x = var_386_cast_fp16)[name = string("transpose_228")]; tensor x_35_cast_fp16 = reshape(shape = concat_2, x = var_388_cast_fp16)[name = string("x_35_cast_fp16")]; tensor var_392_to_fp16 = const()[name = string("op_392_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(66544384)))]; tensor var_393_to_fp16 = const()[name = string("op_393_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(68641600)))]; tensor linear_15_cast_fp16 = linear(bias = var_393_to_fp16, weight = var_392_to_fp16, x = x_35_cast_fp16)[name = string("linear_15_cast_fp16")]; tensor x_37_cast_fp16 = add(x = x_31_cast_fp16, y = linear_15_cast_fp16)[name = string("x_37_cast_fp16")]; tensor var_400_axes_0 = const()[name = string("op_400_axes_0"), val = tensor([-1])]; tensor blocks_2_mlp_ln_weight_to_fp16 = const()[name = string("blocks_2_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(68643712)))]; tensor blocks_2_mlp_ln_bias_to_fp16 = const()[name = string("blocks_2_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(68645824)))]; tensor var_400_cast_fp16 = layer_norm(axes = var_400_axes_0, beta = blocks_2_mlp_ln_bias_to_fp16, epsilon = var_326_to_fp16, gamma = blocks_2_mlp_ln_weight_to_fp16, x = x_37_cast_fp16)[name = string("op_400_cast_fp16")]; tensor var_409_to_fp16 = const()[name = string("op_409_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(68647936)))]; tensor var_410_to_fp16 = const()[name = string("op_410_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(77036608)))]; tensor linear_16_cast_fp16 = linear(bias = var_410_to_fp16, weight = var_409_to_fp16, x = var_400_cast_fp16)[name = string("linear_16_cast_fp16")]; string x_41_mode_0 = const()[name = string("x_41_mode_0"), val = string("EXACT")]; tensor x_41_cast_fp16 = gelu(mode = x_41_mode_0, x = linear_16_cast_fp16)[name = string("x_41_cast_fp16")]; tensor var_415_to_fp16 = const()[name = string("op_415_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(77044864)))]; tensor var_416_to_fp16 = const()[name = string("op_416_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(85433536)))]; tensor linear_17_cast_fp16 = linear(bias = var_416_to_fp16, weight = var_415_to_fp16, x = x_41_cast_fp16)[name = string("linear_17_cast_fp16")]; tensor x_43_cast_fp16 = add(x = x_37_cast_fp16, y = linear_17_cast_fp16)[name = string("x_43_cast_fp16")]; int32 var_426 = const()[name = string("op_426"), val = int32(-1)]; tensor var_442_axes_0 = const()[name = string("op_442_axes_0"), val = tensor([-1])]; tensor blocks_3_attn_ln_weight_to_fp16 = const()[name = string("blocks_3_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(85435648)))]; tensor blocks_3_attn_ln_bias_to_fp16 = const()[name = string("blocks_3_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(85437760)))]; fp16 var_432_to_fp16 = const()[name = string("op_432_to_fp16"), val = fp16(0x1.5p-17)]; tensor var_442_cast_fp16 = layer_norm(axes = var_442_axes_0, beta = blocks_3_attn_ln_bias_to_fp16, epsilon = var_432_to_fp16, gamma = blocks_3_attn_ln_weight_to_fp16, x = x_43_cast_fp16)[name = string("op_442_cast_fp16")]; tensor var_453_to_fp16 = const()[name = string("op_453_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(85439872)))]; tensor var_454_to_fp16 = const()[name = string("op_454_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(87537088)))]; tensor linear_18_cast_fp16 = linear(bias = var_454_to_fp16, weight = var_453_to_fp16, x = var_442_cast_fp16)[name = string("linear_18_cast_fp16")]; tensor var_457_to_fp16 = const()[name = string("op_457_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(87539200)))]; tensor linear_19_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_457_to_fp16, x = var_442_cast_fp16)[name = string("linear_19_cast_fp16")]; tensor var_461_to_fp16 = const()[name = string("op_461_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(89636416)))]; tensor var_462_to_fp16 = const()[name = string("op_462_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(91733632)))]; tensor linear_20_cast_fp16 = linear(bias = var_462_to_fp16, weight = var_461_to_fp16, x = var_442_cast_fp16)[name = string("linear_20_cast_fp16")]; tensor var_470 = const()[name = string("op_470"), val = tensor([1, 1500, 16, -1])]; tensor var_471_cast_fp16 = reshape(shape = var_470, x = linear_18_cast_fp16)[name = string("op_471_cast_fp16")]; tensor const_174_to_fp16 = const()[name = string("const_174_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_15_cast_fp16 = mul(x = var_471_cast_fp16, y = const_174_to_fp16)[name = string("q_15_cast_fp16")]; tensor var_477 = const()[name = string("op_477"), val = tensor([1, 1500, 16, -1])]; tensor var_478_cast_fp16 = reshape(shape = var_477, x = linear_19_cast_fp16)[name = string("op_478_cast_fp16")]; tensor const_175_to_fp16 = const()[name = string("const_175_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_15_cast_fp16 = mul(x = var_478_cast_fp16, y = const_175_to_fp16)[name = string("k_15_cast_fp16")]; tensor var_484 = const()[name = string("op_484"), val = tensor([1, 1500, 16, -1])]; tensor var_485_cast_fp16 = reshape(shape = var_484, x = linear_20_cast_fp16)[name = string("op_485_cast_fp16")]; tensor var_486 = const()[name = string("op_486"), val = tensor([0, 2, 1, 3])]; bool qk_7_transpose_x_0 = const()[name = string("qk_7_transpose_x_0"), val = bool(false)]; bool qk_7_transpose_y_0 = const()[name = string("qk_7_transpose_y_0"), val = bool(false)]; tensor transpose_102_perm_0 = const()[name = string("transpose_102_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_103_perm_0 = const()[name = string("transpose_103_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_103 = transpose(perm = transpose_103_perm_0, x = k_15_cast_fp16)[name = string("transpose_225")]; tensor transpose_102 = transpose(perm = transpose_102_perm_0, x = q_15_cast_fp16)[name = string("transpose_226")]; tensor qk_7_cast_fp16 = matmul(transpose_x = qk_7_transpose_x_0, transpose_y = qk_7_transpose_y_0, x = transpose_102, y = transpose_103)[name = string("qk_7_cast_fp16")]; tensor var_490_cast_fp16 = softmax(axis = var_426, x = qk_7_cast_fp16)[name = string("op_490_cast_fp16")]; bool var_492_transpose_x_0 = const()[name = string("op_492_transpose_x_0"), val = bool(false)]; bool var_492_transpose_y_0 = const()[name = string("op_492_transpose_y_0"), val = bool(false)]; tensor v_15_cast_fp16 = transpose(perm = var_486, x = var_485_cast_fp16)[name = string("transpose_227")]; tensor var_492_cast_fp16 = matmul(transpose_x = var_492_transpose_x_0, transpose_y = var_492_transpose_y_0, x = var_490_cast_fp16, y = v_15_cast_fp16)[name = string("op_492_cast_fp16")]; tensor var_493 = const()[name = string("op_493"), val = tensor([0, 2, 1, 3])]; tensor concat_3 = const()[name = string("concat_3"), val = tensor([1, 1500, 1024])]; tensor var_494_cast_fp16 = transpose(perm = var_493, x = var_492_cast_fp16)[name = string("transpose_224")]; tensor x_47_cast_fp16 = reshape(shape = concat_3, x = var_494_cast_fp16)[name = string("x_47_cast_fp16")]; tensor var_498_to_fp16 = const()[name = string("op_498_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(91735744)))]; tensor var_499_to_fp16 = const()[name = string("op_499_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(93832960)))]; tensor linear_21_cast_fp16 = linear(bias = var_499_to_fp16, weight = var_498_to_fp16, x = x_47_cast_fp16)[name = string("linear_21_cast_fp16")]; tensor x_49_cast_fp16 = add(x = x_43_cast_fp16, y = linear_21_cast_fp16)[name = string("x_49_cast_fp16")]; tensor var_506_axes_0 = const()[name = string("op_506_axes_0"), val = tensor([-1])]; tensor blocks_3_mlp_ln_weight_to_fp16 = const()[name = string("blocks_3_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(93835072)))]; tensor blocks_3_mlp_ln_bias_to_fp16 = const()[name = string("blocks_3_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(93837184)))]; tensor var_506_cast_fp16 = layer_norm(axes = var_506_axes_0, beta = blocks_3_mlp_ln_bias_to_fp16, epsilon = var_432_to_fp16, gamma = blocks_3_mlp_ln_weight_to_fp16, x = x_49_cast_fp16)[name = string("op_506_cast_fp16")]; tensor var_515_to_fp16 = const()[name = string("op_515_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(93839296)))]; tensor var_516_to_fp16 = const()[name = string("op_516_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(102227968)))]; tensor linear_22_cast_fp16 = linear(bias = var_516_to_fp16, weight = var_515_to_fp16, x = var_506_cast_fp16)[name = string("linear_22_cast_fp16")]; string x_53_mode_0 = const()[name = string("x_53_mode_0"), val = string("EXACT")]; tensor x_53_cast_fp16 = gelu(mode = x_53_mode_0, x = linear_22_cast_fp16)[name = string("x_53_cast_fp16")]; tensor var_521_to_fp16 = const()[name = string("op_521_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(102236224)))]; tensor var_522_to_fp16 = const()[name = string("op_522_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(110624896)))]; tensor linear_23_cast_fp16 = linear(bias = var_522_to_fp16, weight = var_521_to_fp16, x = x_53_cast_fp16)[name = string("linear_23_cast_fp16")]; tensor x_55_cast_fp16 = add(x = x_49_cast_fp16, y = linear_23_cast_fp16)[name = string("x_55_cast_fp16")]; int32 var_532 = const()[name = string("op_532"), val = int32(-1)]; tensor var_548_axes_0 = const()[name = string("op_548_axes_0"), val = tensor([-1])]; tensor blocks_4_attn_ln_weight_to_fp16 = const()[name = string("blocks_4_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(110627008)))]; tensor blocks_4_attn_ln_bias_to_fp16 = const()[name = string("blocks_4_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(110629120)))]; fp16 var_538_to_fp16 = const()[name = string("op_538_to_fp16"), val = fp16(0x1.5p-17)]; tensor var_548_cast_fp16 = layer_norm(axes = var_548_axes_0, beta = blocks_4_attn_ln_bias_to_fp16, epsilon = var_538_to_fp16, gamma = blocks_4_attn_ln_weight_to_fp16, x = x_55_cast_fp16)[name = string("op_548_cast_fp16")]; tensor var_559_to_fp16 = const()[name = string("op_559_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(110631232)))]; tensor var_560_to_fp16 = const()[name = string("op_560_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(112728448)))]; tensor linear_24_cast_fp16 = linear(bias = var_560_to_fp16, weight = var_559_to_fp16, x = var_548_cast_fp16)[name = string("linear_24_cast_fp16")]; tensor var_563_to_fp16 = const()[name = string("op_563_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(112730560)))]; tensor linear_25_cast_fp16 = linear(bias = linear_1_bias_0_to_fp16, weight = var_563_to_fp16, x = var_548_cast_fp16)[name = string("linear_25_cast_fp16")]; tensor var_567_to_fp16 = const()[name = string("op_567_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(114827776)))]; tensor var_568_to_fp16 = const()[name = string("op_568_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(116924992)))]; tensor linear_26_cast_fp16 = linear(bias = var_568_to_fp16, weight = var_567_to_fp16, x = var_548_cast_fp16)[name = string("linear_26_cast_fp16")]; tensor var_576 = const()[name = string("op_576"), val = tensor([1, 1500, 16, -1])]; tensor var_577_cast_fp16 = reshape(shape = var_576, x = linear_24_cast_fp16)[name = string("op_577_cast_fp16")]; tensor const_176_to_fp16 = const()[name = string("const_176_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_19_cast_fp16 = mul(x = var_577_cast_fp16, y = const_176_to_fp16)[name = string("q_19_cast_fp16")]; tensor var_583 = const()[name = string("op_583"), val = tensor([1, 1500, 16, -1])]; tensor var_584_cast_fp16 = reshape(shape = var_583, x = linear_25_cast_fp16)[name = string("op_584_cast_fp16")]; tensor const_177_to_fp16 = const()[name = string("const_177_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_19_cast_fp16 = mul(x = var_584_cast_fp16, y = const_177_to_fp16)[name = string("k_19_cast_fp16")]; tensor var_590 = const()[name = string("op_590"), val = tensor([1, 1500, 16, -1])]; tensor var_591_cast_fp16 = reshape(shape = var_590, x = linear_26_cast_fp16)[name = string("op_591_cast_fp16")]; tensor var_592 = const()[name = string("op_592"), val = tensor([0, 2, 1, 3])]; bool qk_9_transpose_x_0 = const()[name = string("qk_9_transpose_x_0"), val = bool(false)]; bool qk_9_transpose_y_0 = const()[name = string("qk_9_transpose_y_0"), val = bool(false)]; tensor transpose_104_perm_0 = const()[name = string("transpose_104_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_105_perm_0 = const()[name = string("transpose_105_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_105 = transpose(perm = transpose_105_perm_0, x = k_19_cast_fp16)[name = string("transpose_221")]; tensor transpose_104 = transpose(perm = transpose_104_perm_0, x = q_19_cast_fp16)[name = string("transpose_222")]; tensor qk_9_cast_fp16 = matmul(transpose_x = qk_9_transpose_x_0, transpose_y = qk_9_transpose_y_0, x = transpose_104, y = transpose_105)[name = string("qk_9_cast_fp16")]; tensor var_596_cast_fp16 = softmax(axis = var_532, x = qk_9_cast_fp16)[name = string("op_596_cast_fp16")]; bool var_598_transpose_x_0 = const()[name = string("op_598_transpose_x_0"), val = bool(false)]; bool var_598_transpose_y_0 = const()[name = string("op_598_transpose_y_0"), val = bool(false)]; tensor v_19_cast_fp16 = transpose(perm = var_592, x = var_591_cast_fp16)[name = string("transpose_223")]; tensor var_598_cast_fp16 = matmul(transpose_x = var_598_transpose_x_0, transpose_y = var_598_transpose_y_0, x = var_596_cast_fp16, y = v_19_cast_fp16)[name = string("op_598_cast_fp16")]; tensor var_599 = const()[name = string("op_599"), val = tensor([0, 2, 1, 3])]; tensor concat_4 = const()[name = string("concat_4"), val = tensor([1, 1500, 1024])]; tensor var_600_cast_fp16 = transpose(perm = var_599, x = var_598_cast_fp16)[name = string("transpose_220")]; tensor x_59_cast_fp16 = reshape(shape = concat_4, x = var_600_cast_fp16)[name = string("x_59_cast_fp16")]; tensor