openai_whisper-large-v3-v20240930_turbo_632MB/TextDecoder.mlmodelc/model.mil
212.1 KB · 1025 lines · plaintext Raw
1 program(1.0)
2 [buildInfo = dict<tensor<string, []>, tensor<string, []>>({{"coremlc-component-MIL", "3304.5.2"}, {"coremlc-version", "3304.6.2"}})]
3 {
4 func main<ios16>(tensor<int32, [1]> cache_length, tensor<fp16, [1, 224]> decoder_key_padding_mask, tensor<fp16, [1, 1280, 1, 1500]> encoder_output_embeds, tensor<int32, [1]> input_ids, tensor<fp16, [1, 5120, 1, 224]> key_cache, tensor<fp16, [1, 224]> kv_cache_update_mask, tensor<fp16, [1, 5120, 1, 224]> value_cache) {
5 tensor<int32, []> var_24_axis_0 = const()[name = tensor<string, []>("op_24_axis_0"), val = tensor<int32, []>(0)];
6 tensor<int32, []> var_24_batch_dims_0 = const()[name = tensor<string, []>("op_24_batch_dims_0"), val = tensor<int32, []>(0)];
7 tensor<fp16, [51866, 1280]> embed_tokens_weight_to_fp16 = const()[name = tensor<string, []>("embed_tokens_weight_to_fp16"), val = tensor<fp16, [51866, 1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(64)))];
8 tensor<fp16, [1, 1280]> var_24_cast_fp16 = gather(axis = var_24_axis_0, batch_dims = var_24_batch_dims_0, indices = input_ids, x = embed_tokens_weight_to_fp16)[name = tensor<string, []>("op_24_cast_fp16")];
9 tensor<int32, []> var_31_axis_0 = const()[name = tensor<string, []>("op_31_axis_0"), val = tensor<int32, []>(0)];
10 tensor<int32, []> var_31_batch_dims_0 = const()[name = tensor<string, []>("op_31_batch_dims_0"), val = tensor<int32, []>(0)];
11 tensor<fp16, [448, 1280]> embed_positions_inlier_module_weight_to_fp16 = const()[name = tensor<string, []>("embed_positions_inlier_module_weight_to_fp16"), val = tensor<fp16, [448, 1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(132777088)))];
12 tensor<fp16, [1, 1280]> var_31_cast_fp16 = gather(axis = var_31_axis_0, batch_dims = var_31_batch_dims_0, indices = cache_length, x = embed_positions_inlier_module_weight_to_fp16)[name = tensor<string, []>("op_31_cast_fp16")];
13 tensor<int32, []> var_33_axis_0 = const()[name = tensor<string, []>("op_33_axis_0"), val = tensor<int32, []>(0)];
14 tensor<int32, []> var_33_batch_dims_0 = const()[name = tensor<string, []>("op_33_batch_dims_0"), val = tensor<int32, []>(0)];
15 tensor<fp16, [448, 1280]> embed_positions_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [71680]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(133941312))), name = tensor<string, []>("embed_positions_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [8582]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(133924032))), shape = tensor<uint32, [2]>([448, 1280])];
16 tensor<fp16, [1, 1280]> var_33_cast_fp16 = gather(axis = var_33_axis_0, batch_dims = var_33_batch_dims_0, indices = cache_length, x = embed_positions_outlier_module_weight_to_fp16_sparsified)[name = tensor<string, []>("op_33_cast_fp16")];
17 tensor<fp16, [1, 1280]> var_34_cast_fp16 = add(x = var_31_cast_fp16, y = var_33_cast_fp16)[name = tensor<string, []>("op_34_cast_fp16")];
18 tensor<fp16, [1, 1280]> hidden_states_1_cast_fp16 = add(x = var_24_cast_fp16, y = var_34_cast_fp16)[name = tensor<string, []>("hidden_states_1_cast_fp16")];
19 tensor<int32, [1]> var_48_axes_0 = const()[name = tensor<string, []>("op_48_axes_0"), val = tensor<int32, [1]>([2])];
20 tensor<fp16, [1, 1280, 1]> var_48_cast_fp16 = expand_dims(axes = var_48_axes_0, x = hidden_states_1_cast_fp16)[name = tensor<string, []>("op_48_cast_fp16")];
21 tensor<int32, [1]> inputs_1_axes_0 = const()[name = tensor<string, []>("inputs_1_axes_0"), val = tensor<int32, [1]>([3])];
22 tensor<fp16, [1, 1280, 1, 1]> inputs_1_cast_fp16 = expand_dims(axes = inputs_1_axes_0, x = var_48_cast_fp16)[name = tensor<string, []>("inputs_1_cast_fp16")];
23 tensor<int32, [4]> tile_0 = const()[name = tensor<string, []>("tile_0"), val = tensor<int32, [4]>([1280, 1280, 1280, 1280])];
24 tensor<int32, []> var_53_axis_0 = const()[name = tensor<string, []>("op_53_axis_0"), val = tensor<int32, []>(1)];
25 tensor<fp16, [1, 1280, 1, 224]> var_53_cast_fp16_0, tensor<fp16, [1, 1280, 1, 224]> var_53_cast_fp16_1, tensor<fp16, [1, 1280, 1, 224]> var_53_cast_fp16_2, tensor<fp16, [1, 1280, 1, 224]> var_53_cast_fp16_3 = split(axis = var_53_axis_0, split_sizes = tile_0, x = key_cache)[name = tensor<string, []>("op_53_cast_fp16")];
26 tensor<int32, [4]> tile_1 = const()[name = tensor<string, []>("tile_1"), val = tensor<int32, [4]>([1280, 1280, 1280, 1280])];
27 tensor<int32, []> var_60_axis_0 = const()[name = tensor<string, []>("op_60_axis_0"), val = tensor<int32, []>(1)];
28 tensor<fp16, [1, 1280, 1, 224]> var_60_cast_fp16_0, tensor<fp16, [1, 1280, 1, 224]> var_60_cast_fp16_1, tensor<fp16, [1, 1280, 1, 224]> var_60_cast_fp16_2, tensor<fp16, [1, 1280, 1, 224]> var_60_cast_fp16_3 = split(axis = var_60_axis_0, split_sizes = tile_1, x = value_cache)[name = tensor<string, []>("op_60_cast_fp16")];
29 tensor<int32, []> var_70 = const()[name = tensor<string, []>("op_70"), val = tensor<int32, []>(3)];
30 tensor<int32, [1]> out_1_axes_0 = const()[name = tensor<string, []>("out_1_axes_0"), val = tensor<int32, [1]>([1])];
31 tensor<fp16, []> var_96_to_fp16 = const()[name = tensor<string, []>("op_96_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
32 tensor<fp16, [1, 1280, 1, 1]> out_1_cast_fp16 = layer_norm(axes = out_1_axes_0, epsilon = var_96_to_fp16, x = inputs_1_cast_fp16)[name = tensor<string, []>("out_1_cast_fp16")];
33 tensor<fp16, [1280]> obj_1_mean_0_to_fp16 = const()[name = tensor<string, []>("obj_1_mean_0_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(134013056)))];
34 tensor<fp16, [1280]> obj_1_variance_0_to_fp16 = const()[name = tensor<string, []>("obj_1_variance_0_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(134015680)))];
35 tensor<fp16, [1280]> obj_1_gamma_0_to_fp16 = const()[name = tensor<string, []>("obj_1_gamma_0_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(134018304)))];
36 tensor<fp16, [1280]> obj_1_beta_0_to_fp16 = const()[name = tensor<string, []>("obj_1_beta_0_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(134020928)))];
37 tensor<fp16, []> obj_1_epsilon_0_to_fp16 = const()[name = tensor<string, []>("obj_1_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
38 tensor<fp16, [1, 1280, 1, 1]> obj_1_cast_fp16 = batch_norm(beta = obj_1_beta_0_to_fp16, epsilon = obj_1_epsilon_0_to_fp16, gamma = obj_1_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_1_cast_fp16)[name = tensor<string, []>("obj_1_cast_fp16")];
39 tensor<string, []> var_118_pad_type_0 = const()[name = tensor<string, []>("op_118_pad_type_0"), val = tensor<string, []>("valid")];
40 tensor<int32, [2]> var_118_strides_0 = const()[name = tensor<string, []>("op_118_strides_0"), val = tensor<int32, [2]>([1, 1])];
41 tensor<int32, [4]> var_118_pad_0 = const()[name = tensor<string, []>("op_118_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
42 tensor<int32, [2]> var_118_dilations_0 = const()[name = tensor<string, []>("op_118_dilations_0"), val = tensor<int32, [2]>([1, 1])];
43 tensor<int32, []> var_118_groups_0 = const()[name = tensor<string, []>("op_118_groups_0"), val = tensor<int32, []>(1)];
44 tensor<fp16, [1280, 1280, 1, 1]> layers_0_self_attn_q_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [819200]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(134023552))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(134842816))), name = tensor<string, []>("layers_0_self_attn_q_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
45 tensor<fp16, [1280]> layers_0_self_attn_q_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_0_self_attn_q_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(134842944)))];
46 tensor<fp16, [1, 1280, 1, 1]> var_118_cast_fp16 = conv(bias = layers_0_self_attn_q_proj_inlier_module_bias_to_fp16, dilations = var_118_dilations_0, groups = var_118_groups_0, pad = var_118_pad_0, pad_type = var_118_pad_type_0, strides = var_118_strides_0, weight = layers_0_self_attn_q_proj_inlier_module_weight_to_fp16_palettized, x = obj_1_cast_fp16)[name = tensor<string, []>("op_118_cast_fp16")];
47 tensor<string, []> var_124_pad_type_0 = const()[name = tensor<string, []>("op_124_pad_type_0"), val = tensor<string, []>("valid")];
48 tensor<int32, [2]> var_124_strides_0 = const()[name = tensor<string, []>("op_124_strides_0"), val = tensor<int32, [2]>([1, 1])];
49 tensor<int32, [4]> var_124_pad_0 = const()[name = tensor<string, []>("op_124_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
50 tensor<int32, [2]> var_124_dilations_0 = const()[name = tensor<string, []>("op_124_dilations_0"), val = tensor<int32, [2]>([1, 1])];
51 tensor<int32, []> var_124_groups_0 = const()[name = tensor<string, []>("op_124_groups_0"), val = tensor<int32, []>(1)];
52 tensor<fp16, [1280, 1280, 1, 1]> layers_0_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [204800]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(134918592))), name = tensor<string, []>("layers_0_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [36461]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(134845568))), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
53 tensor<fp16, [1, 1280, 1, 1]> var_124_cast_fp16 = conv(dilations = var_124_dilations_0, groups = var_124_groups_0, pad = var_124_pad_0, pad_type = var_124_pad_type_0, strides = var_124_strides_0, weight = layers_0_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified, x = obj_1_cast_fp16)[name = tensor<string, []>("op_124_cast_fp16")];
54 tensor<fp16, [1, 1280, 1, 1]> query_1_cast_fp16 = add(x = var_118_cast_fp16, y = var_124_cast_fp16)[name = tensor<string, []>("query_1_cast_fp16")];
55 tensor<string, []> var_133_pad_type_0 = const()[name = tensor<string, []>("op_133_pad_type_0"), val = tensor<string, []>("valid")];
56 tensor<int32, [2]> var_133_strides_0 = const()[name = tensor<string, []>("op_133_strides_0"), val = tensor<int32, [2]>([1, 1])];
57 tensor<int32, [4]> var_133_pad_0 = const()[name = tensor<string, []>("op_133_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
58 tensor<int32, [2]> var_133_dilations_0 = const()[name = tensor<string, []>("op_133_dilations_0"), val = tensor<int32, [2]>([1, 1])];
59 tensor<int32, []> var_133_groups_0 = const()[name = tensor<string, []>("op_133_groups_0"), val = tensor<int32, []>(1)];
60 tensor<fp16, [1280, 1280, 1, 1]> layers_0_self_attn_k_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [819200]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(135123456))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(135942720))), name = tensor<string, []>("layers_0_self_attn_k_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
61 tensor<fp16, [1, 1280, 1, 1]> var_133_cast_fp16 = conv(dilations = var_133_dilations_0, groups = var_133_groups_0, pad = var_133_pad_0, pad_type = var_133_pad_type_0, strides = var_133_strides_0, weight = layers_0_self_attn_k_proj_inlier_module_weight_to_fp16_palettized, x = obj_1_cast_fp16)[name = tensor<string, []>("op_133_cast_fp16")];
62 tensor<string, []> var_139_pad_type_0 = const()[name = tensor<string, []>("op_139_pad_type_0"), val = tensor<string, []>("valid")];
63 tensor<int32, [2]> var_139_strides_0 = const()[name = tensor<string, []>("op_139_strides_0"), val = tensor<int32, [2]>([1, 1])];
64 tensor<int32, [4]> var_139_pad_0 = const()[name = tensor<string, []>("op_139_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
65 tensor<int32, [2]> var_139_dilations_0 = const()[name = tensor<string, []>("op_139_dilations_0"), val = tensor<int32, [2]>([1, 1])];
66 tensor<int32, []> var_139_groups_0 = const()[name = tensor<string, []>("op_139_groups_0"), val = tensor<int32, []>(1)];
67 tensor<fp16, [1280, 1280, 1, 1]> layers_0_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [204800]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(135976320))), name = tensor<string, []>("layers_0_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [16673]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(135942848))), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
68 tensor<fp16, [1, 1280, 1, 1]> var_139_cast_fp16 = conv(dilations = var_139_dilations_0, groups = var_139_groups_0, pad = var_139_pad_0, pad_type = var_139_pad_type_0, strides = var_139_strides_0, weight = layers_0_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified, x = obj_1_cast_fp16)[name = tensor<string, []>("op_139_cast_fp16")];
69 tensor<fp16, [1, 1280, 1, 1]> current_key_1_cast_fp16 = add(x = var_133_cast_fp16, y = var_139_cast_fp16)[name = tensor<string, []>("current_key_1_cast_fp16")];
70 tensor<string, []> var_149_pad_type_0 = const()[name = tensor<string, []>("op_149_pad_type_0"), val = tensor<string, []>("valid")];
71 tensor<int32, [2]> var_149_strides_0 = const()[name = tensor<string, []>("op_149_strides_0"), val = tensor<int32, [2]>([1, 1])];
72 tensor<int32, [4]> var_149_pad_0 = const()[name = tensor<string, []>("op_149_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
73 tensor<int32, [2]> var_149_dilations_0 = const()[name = tensor<string, []>("op_149_dilations_0"), val = tensor<int32, [2]>([1, 1])];
74 tensor<int32, []> var_149_groups_0 = const()[name = tensor<string, []>("op_149_groups_0"), val = tensor<int32, []>(1)];
75 tensor<fp16, [1280, 1280, 1, 1]> layers_0_self_attn_v_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [819200]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(136181184))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(137000448))), name = tensor<string, []>("layers_0_self_attn_v_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
76 tensor<fp16, [1280]> layers_0_self_attn_v_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_0_self_attn_v_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(137000576)))];
77 tensor<fp16, [1, 1280, 1, 1]> var_149_cast_fp16 = conv(bias = layers_0_self_attn_v_proj_inlier_module_bias_to_fp16, dilations = var_149_dilations_0, groups = var_149_groups_0, pad = var_149_pad_0, pad_type = var_149_pad_type_0, strides = var_149_strides_0, weight = layers_0_self_attn_v_proj_inlier_module_weight_to_fp16_palettized, x = obj_1_cast_fp16)[name = tensor<string, []>("op_149_cast_fp16")];
78 tensor<string, []> var_155_pad_type_0 = const()[name = tensor<string, []>("op_155_pad_type_0"), val = tensor<string, []>("valid")];
79 tensor<int32, [2]> var_155_strides_0 = const()[name = tensor<string, []>("op_155_strides_0"), val = tensor<int32, [2]>([1, 1])];
80 tensor<int32, [4]> var_155_pad_0 = const()[name = tensor<string, []>("op_155_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
81 tensor<int32, [2]> var_155_dilations_0 = const()[name = tensor<string, []>("op_155_dilations_0"), val = tensor<int32, [2]>([1, 1])];
82 tensor<int32, []> var_155_groups_0 = const()[name = tensor<string, []>("op_155_groups_0"), val = tensor<int32, []>(1)];
83 tensor<fp16, [1280, 1280, 1, 1]> layers_0_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [204800]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(137046720))), name = tensor<string, []>("layers_0_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [21721]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(137003200))), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
84 tensor<fp16, [1, 1280, 1, 1]> var_155_cast_fp16 = conv(dilations = var_155_dilations_0, groups = var_155_groups_0, pad = var_155_pad_0, pad_type = var_155_pad_type_0, strides = var_155_strides_0, weight = layers_0_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified, x = obj_1_cast_fp16)[name = tensor<string, []>("op_155_cast_fp16")];
85 tensor<fp16, [1, 1280, 1, 1]> current_value_1_cast_fp16 = add(x = var_149_cast_fp16, y = var_155_cast_fp16)[name = tensor<string, []>("current_value_1_cast_fp16")];
86 tensor<int32, [1]> var_158_axes_0 = const()[name = tensor<string, []>("op_158_axes_0"), val = tensor<int32, [1]>([1])];
87 tensor<fp16, [1, 1, 224]> var_158_cast_fp16 = expand_dims(axes = var_158_axes_0, x = kv_cache_update_mask)[name = tensor<string, []>("op_158_cast_fp16")];
88 tensor<int32, [1]> var_159_axes_0 = const()[name = tensor<string, []>("op_159_axes_0"), val = tensor<int32, [1]>([2])];
89 tensor<fp16, [1, 1, 1, 224]> var_159_cast_fp16 = expand_dims(axes = var_159_axes_0, x = var_158_cast_fp16)[name = tensor<string, []>("op_159_cast_fp16")];
90 tensor<fp16, [1, 1280, 1, 224]> var_161_cast_fp16 = mul(x = current_key_1_cast_fp16, y = var_159_cast_fp16)[name = tensor<string, []>("op_161_cast_fp16")];
91 tensor<fp16, []> var_71_to_fp16 = const()[name = tensor<string, []>("op_71_to_fp16"), val = tensor<fp16, []>(0x1p+0)];
92 tensor<fp16, [1, 1, 1, 224]> var_162_cast_fp16 = sub(x = var_71_to_fp16, y = var_159_cast_fp16)[name = tensor<string, []>("op_162_cast_fp16")];
93 tensor<fp16, [1, 1280, 1, 224]> var_163_cast_fp16 = mul(x = var_53_cast_fp16_0, y = var_162_cast_fp16)[name = tensor<string, []>("op_163_cast_fp16")];
94 tensor<fp16, [1, 1280, 1, 224]> key_1_cast_fp16 = add(x = var_161_cast_fp16, y = var_163_cast_fp16)[name = tensor<string, []>("key_1_cast_fp16")];
95 tensor<fp16, [1, 1280, 1, 224]> var_165_cast_fp16 = mul(x = current_value_1_cast_fp16, y = var_159_cast_fp16)[name = tensor<string, []>("op_165_cast_fp16")];
96 tensor<fp16, [1, 1280, 1, 224]> var_167_cast_fp16 = mul(x = var_60_cast_fp16_0, y = var_162_cast_fp16)[name = tensor<string, []>("op_167_cast_fp16")];
97 tensor<fp16, [1, 1280, 1, 224]> value_1_cast_fp16 = add(x = var_165_cast_fp16, y = var_167_cast_fp16)[name = tensor<string, []>("value_1_cast_fp16")];
98 tensor<int32, [4]> var_170 = const()[name = tensor<string, []>("op_170"), val = tensor<int32, [4]>([1, 20, 64, -1])];
99 tensor<fp16, [1, 20, 64, 1]> mh_q_1_cast_fp16 = reshape(shape = var_170, x = query_1_cast_fp16)[name = tensor<string, []>("mh_q_1_cast_fp16")];
100 tensor<fp16, []> var_172_to_fp16 = const()[name = tensor<string, []>("op_172_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
101 tensor<fp16, [1, 20, 64, 1]> var_173_cast_fp16 = mul(x = mh_q_1_cast_fp16, y = var_172_to_fp16)[name = tensor<string, []>("op_173_cast_fp16")];
102 tensor<int32, [4]> var_174 = const()[name = tensor<string, []>("op_174"), val = tensor<int32, [4]>([1, 20, 64, -1])];
103 tensor<fp16, [1, 20, 64, 224]> var_175_cast_fp16 = reshape(shape = var_174, x = key_1_cast_fp16)[name = tensor<string, []>("op_175_cast_fp16")];
104 tensor<bool, []> mh_w_1_transpose_x_0 = const()[name = tensor<string, []>("mh_w_1_transpose_x_0"), val = tensor<bool, []>(true)];
105 tensor<bool, []> mh_w_1_transpose_y_0 = const()[name = tensor<string, []>("mh_w_1_transpose_y_0"), val = tensor<bool, []>(false)];
106 tensor<fp16, [1, 20, 1, 224]> mh_w_1_cast_fp16 = matmul(transpose_x = mh_w_1_transpose_x_0, transpose_y = mh_w_1_transpose_y_0, x = var_173_cast_fp16, y = var_175_cast_fp16)[name = tensor<string, []>("mh_w_1_cast_fp16")];
107 tensor<int32, [1]> var_179_axes_0 = const()[name = tensor<string, []>("op_179_axes_0"), val = tensor<int32, [1]>([1])];
108 tensor<fp16, [1, 1, 224]> var_179_cast_fp16 = expand_dims(axes = var_179_axes_0, x = decoder_key_padding_mask)[name = tensor<string, []>("op_179_cast_fp16")];
109 tensor<int32, [1]> var_180_axes_0 = const()[name = tensor<string, []>("op_180_axes_0"), val = tensor<int32, [1]>([2])];
110 tensor<fp16, [1, 1, 1, 224]> var_180_cast_fp16 = expand_dims(axes = var_180_axes_0, x = var_179_cast_fp16)[name = tensor<string, []>("op_180_cast_fp16")];
111 tensor<fp16, [1, 20, 1, 224]> mh_w_3_cast_fp16 = add(x = mh_w_1_cast_fp16, y = var_180_cast_fp16)[name = tensor<string, []>("mh_w_3_cast_fp16")];
112 tensor<fp16, [1, 20, 1, 224]> var_183_cast_fp16 = softmax(axis = var_70, x = mh_w_3_cast_fp16)[name = tensor<string, []>("op_183_cast_fp16")];
113 tensor<int32, [4]> var_184 = const()[name = tensor<string, []>("op_184"), val = tensor<int32, [4]>([1, 20, 64, -1])];
114 tensor<fp16, [1, 20, 64, 224]> var_185_cast_fp16 = reshape(shape = var_184, x = value_1_cast_fp16)[name = tensor<string, []>("op_185_cast_fp16")];
115 tensor<bool, []> attn_1_transpose_x_0 = const()[name = tensor<string, []>("attn_1_transpose_x_0"), val = tensor<bool, []>(false)];
116 tensor<bool, []> attn_1_transpose_y_0 = const()[name = tensor<string, []>("attn_1_transpose_y_0"), val = tensor<bool, []>(true)];
117 tensor<fp16, [1, 20, 64, 1]> attn_1_cast_fp16 = matmul(transpose_x = attn_1_transpose_x_0, transpose_y = attn_1_transpose_y_0, x = var_185_cast_fp16, y = var_183_cast_fp16)[name = tensor<string, []>("attn_1_cast_fp16")];
118 tensor<int32, [4]> var_188 = const()[name = tensor<string, []>("op_188"), val = tensor<int32, [4]>([1, 1280, 1, -1])];
119 tensor<fp16, [1, 1280, 1, 1]> input_1_cast_fp16 = reshape(shape = var_188, x = attn_1_cast_fp16)[name = tensor<string, []>("input_1_cast_fp16")];
120 tensor<string, []> var_198_pad_type_0 = const()[name = tensor<string, []>("op_198_pad_type_0"), val = tensor<string, []>("valid")];
121 tensor<int32, [2]> var_198_strides_0 = const()[name = tensor<string, []>("op_198_strides_0"), val = tensor<int32, [2]>([1, 1])];
122 tensor<int32, [4]> var_198_pad_0 = const()[name = tensor<string, []>("op_198_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
123 tensor<int32, [2]> var_198_dilations_0 = const()[name = tensor<string, []>("op_198_dilations_0"), val = tensor<int32, [2]>([1, 1])];
124 tensor<int32, []> var_198_groups_0 = const()[name = tensor<string, []>("op_198_groups_0"), val = tensor<int32, []>(1)];
125 tensor<fp16, [1280, 1280, 1, 1]> layers_0_self_attn_o_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [819200]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(137251584))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(138070848))), name = tensor<string, []>("layers_0_self_attn_o_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
126 tensor<fp16, [1280]> layers_0_self_attn_o_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_0_self_attn_o_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(138070976)))];
127 tensor<fp16, [1, 1280, 1, 1]> var_198_cast_fp16 = conv(bias = layers_0_self_attn_o_proj_inlier_module_bias_to_fp16, dilations = var_198_dilations_0, groups = var_198_groups_0, pad = var_198_pad_0, pad_type = var_198_pad_type_0, strides = var_198_strides_0, weight = layers_0_self_attn_o_proj_inlier_module_weight_to_fp16_palettized, x = input_1_cast_fp16)[name = tensor<string, []>("op_198_cast_fp16")];
128 tensor<string, []> var_204_pad_type_0 = const()[name = tensor<string, []>("op_204_pad_type_0"), val = tensor<string, []>("valid")];
129 tensor<int32, [2]> var_204_strides_0 = const()[name = tensor<string, []>("op_204_strides_0"), val = tensor<int32, [2]>([1, 1])];
130 tensor<int32, [4]> var_204_pad_0 = const()[name = tensor<string, []>("op_204_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
131 tensor<int32, [2]> var_204_dilations_0 = const()[name = tensor<string, []>("op_204_dilations_0"), val = tensor<int32, [2]>([1, 1])];
132 tensor<int32, []> var_204_groups_0 = const()[name = tensor<string, []>("op_204_groups_0"), val = tensor<int32, []>(1)];
133 tensor<fp16, [1280, 1280, 1, 1]> layers_0_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [204800]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(138130624))), name = tensor<string, []>("layers_0_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [28455]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(138073600))), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
134 tensor<fp16, [1, 1280, 1, 1]> var_204_cast_fp16 = conv(dilations = var_204_dilations_0, groups = var_204_groups_0, pad = var_204_pad_0, pad_type = var_204_pad_type_0, strides = var_204_strides_0, weight = layers_0_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified, x = input_1_cast_fp16)[name = tensor<string, []>("op_204_cast_fp16")];
135 tensor<fp16, [1, 1280, 1, 1]> obj_7_cast_fp16 = add(x = var_198_cast_fp16, y = var_204_cast_fp16)[name = tensor<string, []>("obj_7_cast_fp16")];
136 tensor<fp16, [1, 1280, 1, 1]> inputs_3_cast_fp16 = add(x = inputs_1_cast_fp16, y = obj_7_cast_fp16)[name = tensor<string, []>("inputs_3_cast_fp16")];
137 tensor<int32, [1]> out_3_axes_0 = const()[name = tensor<string, []>("out_3_axes_0"), val = tensor<int32, [1]>([1])];
138 tensor<fp16, []> var_219_to_fp16 = const()[name = tensor<string, []>("op_219_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
139 tensor<fp16, [1, 1280, 1, 1]> out_3_cast_fp16 = layer_norm(axes = out_3_axes_0, epsilon = var_219_to_fp16, x = inputs_3_cast_fp16)[name = tensor<string, []>("out_3_cast_fp16")];
140 tensor<fp16, [1280]> obj_9_gamma_0_to_fp16 = const()[name = tensor<string, []>("obj_9_gamma_0_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(138335488)))];
141 tensor<fp16, [1280]> obj_9_beta_0_to_fp16 = const()[name = tensor<string, []>("obj_9_beta_0_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(138338112)))];
142 tensor<fp16, []> obj_9_epsilon_0_to_fp16 = const()[name = tensor<string, []>("obj_9_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
143 tensor<fp16, [1, 1280, 1, 1]> obj_9_cast_fp16 = batch_norm(beta = obj_9_beta_0_to_fp16, epsilon = obj_9_epsilon_0_to_fp16, gamma = obj_9_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_3_cast_fp16)[name = tensor<string, []>("obj_9_cast_fp16")];
144 tensor<string, []> var_241_pad_type_0 = const()[name = tensor<string, []>("op_241_pad_type_0"), val = tensor<string, []>("valid")];
145 tensor<int32, [2]> var_241_strides_0 = const()[name = tensor<string, []>("op_241_strides_0"), val = tensor<int32, [2]>([1, 1])];
146 tensor<int32, [4]> var_241_pad_0 = const()[name = tensor<string, []>("op_241_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
147 tensor<int32, [2]> var_241_dilations_0 = const()[name = tensor<string, []>("op_241_dilations_0"), val = tensor<int32, [2]>([1, 1])];
148 tensor<int32, []> var_241_groups_0 = const()[name = tensor<string, []>("op_241_groups_0"), val = tensor<int32, []>(1)];
149 tensor<fp16, [1280, 1280, 1, 1]> layers_0_encoder_attn_q_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [819200]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(138340736))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(139160000))), name = tensor<string, []>("layers_0_encoder_attn_q_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
150 tensor<fp16, [1280]> layers_0_encoder_attn_q_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_0_encoder_attn_q_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(139160128)))];
151 tensor<fp16, [1, 1280, 1, 1]> var_241_cast_fp16 = conv(bias = layers_0_encoder_attn_q_proj_inlier_module_bias_to_fp16, dilations = var_241_dilations_0, groups = var_241_groups_0, pad = var_241_pad_0, pad_type = var_241_pad_type_0, strides = var_241_strides_0, weight = layers_0_encoder_attn_q_proj_inlier_module_weight_to_fp16_palettized, x = obj_9_cast_fp16)[name = tensor<string, []>("op_241_cast_fp16")];
152 tensor<string, []> var_247_pad_type_0 = const()[name = tensor<string, []>("op_247_pad_type_0"), val = tensor<string, []>("valid")];
153 tensor<int32, [2]> var_247_strides_0 = const()[name = tensor<string, []>("op_247_strides_0"), val = tensor<int32, [2]>([1, 1])];
154 tensor<int32, [4]> var_247_pad_0 = const()[name = tensor<string, []>("op_247_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
155 tensor<int32, [2]> var_247_dilations_0 = const()[name = tensor<string, []>("op_247_dilations_0"), val = tensor<int32, [2]>([1, 1])];
156 tensor<int32, []> var_247_groups_0 = const()[name = tensor<string, []>("op_247_groups_0"), val = tensor<int32, []>(1)];
157 tensor<fp16, [1280, 1280, 1, 1]> layers_0_encoder_attn_q_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [204800]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(139188224))), name = tensor<string, []>("layers_0_encoder_attn_q_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [12701]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(139162752))), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
158 tensor<fp16, [1, 1280, 1, 1]> var_247_cast_fp16 = conv(dilations = var_247_dilations_0, groups = var_247_groups_0, pad = var_247_pad_0, pad_type = var_247_pad_type_0, strides = var_247_strides_0, weight = layers_0_encoder_attn_q_proj_outlier_module_weight_to_fp16_sparsified, x = obj_9_cast_fp16)[name = tensor<string, []>("op_247_cast_fp16")];
159 tensor<fp16, [1, 1280, 1, 1]> query_3_cast_fp16 = add(x = var_241_cast_fp16, y = var_247_cast_fp16)[name = tensor<string, []>("query_3_cast_fp16")];
160 tensor<string, []> var_256_pad_type_0 = const()[name = tensor<string, []>("op_256_pad_type_0"), val = tensor<string, []>("valid")];
161 tensor<int32, [2]> var_256_strides_0 = const()[name = tensor<string, []>("op_256_strides_0"), val = tensor<int32, [2]>([1, 1])];
162 tensor<int32, [4]> var_256_pad_0 = const()[name = tensor<string, []>("op_256_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
163 tensor<int32, [2]> var_256_dilations_0 = const()[name = tensor<string, []>("op_256_dilations_0"), val = tensor<int32, [2]>([1, 1])];
164 tensor<int32, []> var_256_groups_0 = const()[name = tensor<string, []>("op_256_groups_0"), val = tensor<int32, []>(1)];
165 tensor<fp16, [1280, 1280, 1, 1]> layers_0_encoder_attn_k_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [819200]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(139393088))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(140212352))), name = tensor<string, []>("layers_0_encoder_attn_k_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
166 tensor<fp16, [1, 1280, 1, 1500]> var_256_cast_fp16 = conv(dilations = var_256_dilations_0, groups = var_256_groups_0, pad = var_256_pad_0, pad_type = var_256_pad_type_0, strides = var_256_strides_0, weight = layers_0_encoder_attn_k_proj_inlier_module_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor<string, []>("op_256_cast_fp16")];
167 tensor<string, []> var_262_pad_type_0 = const()[name = tensor<string, []>("op_262_pad_type_0"), val = tensor<string, []>("valid")];
168 tensor<int32, [2]> var_262_strides_0 = const()[name = tensor<string, []>("op_262_strides_0"), val = tensor<int32, [2]>([1, 1])];
169 tensor<int32, [4]> var_262_pad_0 = const()[name = tensor<string, []>("op_262_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
170 tensor<int32, [2]> var_262_dilations_0 = const()[name = tensor<string, []>("op_262_dilations_0"), val = tensor<int32, [2]>([1, 1])];
171 tensor<int32, []> var_262_groups_0 = const()[name = tensor<string, []>("op_262_groups_0"), val = tensor<int32, []>(1)];
172 tensor<fp16, [1280, 1280, 1, 1]> layers_0_encoder_attn_k_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [204800]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(140272448))), name = tensor<string, []>("layers_0_encoder_attn_k_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [29949]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(140212480))), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
173 tensor<fp16, [1, 1280, 1, 1500]> var_262_cast_fp16 = conv(dilations = var_262_dilations_0, groups = var_262_groups_0, pad = var_262_pad_0, pad_type = var_262_pad_type_0, strides = var_262_strides_0, weight = layers_0_encoder_attn_k_proj_outlier_module_weight_to_fp16_sparsified, x = encoder_output_embeds)[name = tensor<string, []>("op_262_cast_fp16")];
174 tensor<fp16, [1, 1280, 1, 1500]> key_3_cast_fp16 = add(x = var_256_cast_fp16, y = var_262_cast_fp16)[name = tensor<string, []>("key_3_cast_fp16")];
175 tensor<string, []> var_272_pad_type_0 = const()[name = tensor<string, []>("op_272_pad_type_0"), val = tensor<string, []>("valid")];
176 tensor<int32, [2]> var_272_strides_0 = const()[name = tensor<string, []>("op_272_strides_0"), val = tensor<int32, [2]>([1, 1])];
177 tensor<int32, [4]> var_272_pad_0 = const()[name = tensor<string, []>("op_272_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
178 tensor<int32, [2]> var_272_dilations_0 = const()[name = tensor<string, []>("op_272_dilations_0"), val = tensor<int32, [2]>([1, 1])];
179 tensor<int32, []> var_272_groups_0 = const()[name = tensor<string, []>("op_272_groups_0"), val = tensor<int32, []>(1)];
180 tensor<fp16, [1280, 1280, 1, 1]> layers_0_encoder_attn_v_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [819200]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(140477312))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(141296576))), name = tensor<string, []>("layers_0_encoder_attn_v_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
181 tensor<fp16, [1280]> layers_0_encoder_attn_v_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_0_encoder_attn_v_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(141296704)))];
182 tensor<fp16, [1, 1280, 1, 1500]> var_272_cast_fp16 = conv(bias = layers_0_encoder_attn_v_proj_inlier_module_bias_to_fp16, dilations = var_272_dilations_0, groups = var_272_groups_0, pad = var_272_pad_0, pad_type = var_272_pad_type_0, strides = var_272_strides_0, weight = layers_0_encoder_attn_v_proj_inlier_module_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor<string, []>("op_272_cast_fp16")];
183 tensor<string, []> var_278_pad_type_0 = const()[name = tensor<string, []>("op_278_pad_type_0"), val = tensor<string, []>("valid")];
184 tensor<int32, [2]> var_278_strides_0 = const()[name = tensor<string, []>("op_278_strides_0"), val = tensor<int32, [2]>([1, 1])];
185 tensor<int32, [4]> var_278_pad_0 = const()[name = tensor<string, []>("op_278_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
186 tensor<int32, [2]> var_278_dilations_0 = const()[name = tensor<string, []>("op_278_dilations_0"), val = tensor<int32, [2]>([1, 1])];
187 tensor<int32, []> var_278_groups_0 = const()[name = tensor<string, []>("op_278_groups_0"), val = tensor<int32, []>(1)];
188 tensor<fp16, [1280, 1280, 1, 1]> layers_0_encoder_attn_v_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [204800]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(141310592))), name = tensor<string, []>("layers_0_encoder_attn_v_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [5596]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(141299328))), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
189 tensor<fp16, [1, 1280, 1, 1500]> var_278_cast_fp16 = conv(dilations = var_278_dilations_0, groups = var_278_groups_0, pad = var_278_pad_0, pad_type = var_278_pad_type_0, strides = var_278_strides_0, weight = layers_0_encoder_attn_v_proj_outlier_module_weight_to_fp16_sparsified, x = encoder_output_embeds)[name = tensor<string, []>("op_278_cast_fp16")];
190 tensor<fp16, [1, 1280, 1, 1500]> value_3_cast_fp16 = add(x = var_272_cast_fp16, y = var_278_cast_fp16)[name = tensor<string, []>("value_3_cast_fp16")];
191 tensor<int32, [4]> var_281 = const()[name = tensor<string, []>("op_281"), val = tensor<int32, [4]>([1, 20, 64, -1])];
192 tensor<fp16, [1, 20, 64, 1]> mh_q_3_cast_fp16 = reshape(shape = var_281, x = query_3_cast_fp16)[name = tensor<string, []>("mh_q_3_cast_fp16")];
193 tensor<fp16, []> var_283_to_fp16 = const()[name = tensor<string, []>("op_283_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
194 tensor<fp16, [1, 20, 64, 1]> var_284_cast_fp16 = mul(x = mh_q_3_cast_fp16, y = var_283_to_fp16)[name = tensor<string, []>("op_284_cast_fp16")];
195 tensor<int32, [4]> var_285 = const()[name = tensor<string, []>("op_285"), val = tensor<int32, [4]>([1, 20, 64, -1])];
196 tensor<fp16, [1, 20, 64, 1500]> var_286_cast_fp16 = reshape(shape = var_285, x = key_3_cast_fp16)[name = tensor<string, []>("op_286_cast_fp16")];
197 tensor<bool, []> mh_w_5_transpose_x_0 = const()[name = tensor<string, []>("mh_w_5_transpose_x_0"), val = tensor<bool, []>(true)];
198 tensor<bool, []> mh_w_5_transpose_y_0 = const()[name = tensor<string, []>("mh_w_5_transpose_y_0"), val = tensor<bool, []>(false)];
199 tensor<fp16, [1, 20, 1, 1500]> mh_w_5_cast_fp16 = matmul(transpose_x = mh_w_5_transpose_x_0, transpose_y = mh_w_5_transpose_y_0, x = var_284_cast_fp16, y = var_286_cast_fp16)[name = tensor<string, []>("mh_w_5_cast_fp16")];
200 tensor<fp16, [1, 20, 1, 1500]> obj_13_cast_fp16 = softmax(axis = var_70, x = mh_w_5_cast_fp16)[name = tensor<string, []>("obj_13_cast_fp16")];
201 tensor<int32, [4]> var_290 = const()[name = tensor<string, []>("op_290"), val = tensor<int32, [4]>([1, 20, 64, -1])];
202 tensor<fp16, [1, 20, 64, 1500]> var_291_cast_fp16 = reshape(shape = var_290, x = value_3_cast_fp16)[name = tensor<string, []>("op_291_cast_fp16")];
203 tensor<bool, []> attn_3_transpose_x_0 = const()[name = tensor<string, []>("attn_3_transpose_x_0"), val = tensor<bool, []>(false)];
204 tensor<bool, []> attn_3_transpose_y_0 = const()[name = tensor<string, []>("attn_3_transpose_y_0"), val = tensor<bool, []>(true)];
205 tensor<fp16, [1, 20, 64, 1]> attn_3_cast_fp16 = matmul(transpose_x = attn_3_transpose_x_0, transpose_y = attn_3_transpose_y_0, x = var_291_cast_fp16, y = obj_13_cast_fp16)[name = tensor<string, []>("attn_3_cast_fp16")];
206 tensor<int32, [4]> var_294 = const()[name = tensor<string, []>("op_294"), val = tensor<int32, [4]>([1, 1280, 1, -1])];
207 tensor<fp16, [1, 1280, 1, 1]> input_3_cast_fp16 = reshape(shape = var_294, x = attn_3_cast_fp16)[name = tensor<string, []>("input_3_cast_fp16")];
208 tensor<string, []> var_304_pad_type_0 = const()[name = tensor<string, []>("op_304_pad_type_0"), val = tensor<string, []>("valid")];
209 tensor<int32, [2]> var_304_strides_0 = const()[name = tensor<string, []>("op_304_strides_0"), val = tensor<int32, [2]>([1, 1])];
210 tensor<int32, [4]> var_304_pad_0 = const()[name = tensor<string, []>("op_304_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
211 tensor<int32, [2]> var_304_dilations_0 = const()[name = tensor<string, []>("op_304_dilations_0"), val = tensor<int32, [2]>([1, 1])];
212 tensor<int32, []> var_304_groups_0 = const()[name = tensor<string, []>("op_304_groups_0"), val = tensor<int32, []>(1)];
213 tensor<fp16, [1280, 1280, 1, 1]> layers_0_encoder_attn_o_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [819200]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(141515456))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(142334720))), name = tensor<string, []>("layers_0_encoder_attn_o_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
214 tensor<fp16, [1280]> layers_0_encoder_attn_o_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_0_encoder_attn_o_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(142334848)))];
215 tensor<fp16, [1, 1280, 1, 1]> var_304_cast_fp16 = conv(bias = layers_0_encoder_attn_o_proj_inlier_module_bias_to_fp16, dilations = var_304_dilations_0, groups = var_304_groups_0, pad = var_304_pad_0, pad_type = var_304_pad_type_0, strides = var_304_strides_0, weight = layers_0_encoder_attn_o_proj_inlier_module_weight_to_fp16_palettized, x = input_3_cast_fp16)[name = tensor<string, []>("op_304_cast_fp16")];
216 tensor<string, []> var_310_pad_type_0 = const()[name = tensor<string, []>("op_310_pad_type_0"), val = tensor<string, []>("valid")];
217 tensor<int32, [2]> var_310_strides_0 = const()[name = tensor<string, []>("op_310_strides_0"), val = tensor<int32, [2]>([1, 1])];
218 tensor<int32, [4]> var_310_pad_0 = const()[name = tensor<string, []>("op_310_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
219 tensor<int32, [2]> var_310_dilations_0 = const()[name = tensor<string, []>("op_310_dilations_0"), val = tensor<int32, [2]>([1, 1])];
220 tensor<int32, []> var_310_groups_0 = const()[name = tensor<string, []>("op_310_groups_0"), val = tensor<int32, []>(1)];
221 tensor<fp16, [1280, 1280, 1, 1]> layers_0_encoder_attn_o_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [204800]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(142349632))), name = tensor<string, []>("layers_0_encoder_attn_o_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [6041]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(142337472))), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
222 tensor<fp16, [1, 1280, 1, 1]> var_310_cast_fp16 = conv(dilations = var_310_dilations_0, groups = var_310_groups_0, pad = var_310_pad_0, pad_type = var_310_pad_type_0, strides = var_310_strides_0, weight = layers_0_encoder_attn_o_proj_outlier_module_weight_to_fp16_sparsified, x = input_3_cast_fp16)[name = tensor<string, []>("op_310_cast_fp16")];
223 tensor<fp16, [1, 1280, 1, 1]> obj_11_cast_fp16 = add(x = var_304_cast_fp16, y = var_310_cast_fp16)[name = tensor<string, []>("obj_11_cast_fp16")];
224 tensor<fp16, [1, 1280, 1, 1]> inputs_5_cast_fp16 = add(x = inputs_3_cast_fp16, y = obj_11_cast_fp16)[name = tensor<string, []>("inputs_5_cast_fp16")];
225 tensor<int32, [1]> out_5_axes_0 = const()[name = tensor<string, []>("out_5_axes_0"), val = tensor<int32, [1]>([1])];
226 tensor<fp16, []> var_321_to_fp16 = const()[name = tensor<string, []>("op_321_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
227 tensor<fp16, [1, 1280, 1, 1]> out_5_cast_fp16 = layer_norm(axes = out_5_axes_0, epsilon = var_321_to_fp16, x = inputs_5_cast_fp16)[name = tensor<string, []>("out_5_cast_fp16")];
228 tensor<fp16, [1280]> input_5_gamma_0_to_fp16 = const()[name = tensor<string, []>("input_5_gamma_0_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(142554496)))];
229 tensor<fp16, [1280]> input_5_beta_0_to_fp16 = const()[name = tensor<string, []>("input_5_beta_0_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(142557120)))];
230 tensor<fp16, []> input_5_epsilon_0_to_fp16 = const()[name = tensor<string, []>("input_5_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
231 tensor<fp16, [1, 1280, 1, 1]> input_5_cast_fp16 = batch_norm(beta = input_5_beta_0_to_fp16, epsilon = input_5_epsilon_0_to_fp16, gamma = input_5_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_5_cast_fp16)[name = tensor<string, []>("input_5_cast_fp16")];
232 tensor<string, []> var_339_pad_type_0 = const()[name = tensor<string, []>("op_339_pad_type_0"), val = tensor<string, []>("valid")];
233 tensor<int32, [2]> var_339_strides_0 = const()[name = tensor<string, []>("op_339_strides_0"), val = tensor<int32, [2]>([1, 1])];
234 tensor<int32, [4]> var_339_pad_0 = const()[name = tensor<string, []>("op_339_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
235 tensor<int32, [2]> var_339_dilations_0 = const()[name = tensor<string, []>("op_339_dilations_0"), val = tensor<int32, [2]>([1, 1])];
236 tensor<int32, []> var_339_groups_0 = const()[name = tensor<string, []>("op_339_groups_0"), val = tensor<int32, []>(1)];
237 tensor<fp16, [5120, 1280, 1, 1]> layers_0_fc1_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [3276800]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(142559744))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(145836608))), name = tensor<string, []>("layers_0_fc1_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([5120, 1280, 1, 1])];
238 tensor<fp16, [5120]> layers_0_fc1_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_0_fc1_inlier_module_bias_to_fp16"), val = tensor<fp16, [5120]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(145836736)))];
239 tensor<fp16, [1, 5120, 1, 1]> var_339_cast_fp16 = conv(bias = layers_0_fc1_inlier_module_bias_to_fp16, dilations = var_339_dilations_0, groups = var_339_groups_0, pad = var_339_pad_0, pad_type = var_339_pad_type_0, strides = var_339_strides_0, weight = layers_0_fc1_inlier_module_weight_to_fp16_palettized, x = input_5_cast_fp16)[name = tensor<string, []>("op_339_cast_fp16")];
240 tensor<string, []> var_345_pad_type_0 = const()[name = tensor<string, []>("op_345_pad_type_0"), val = tensor<string, []>("valid")];
241 tensor<int32, [2]> var_345_strides_0 = const()[name = tensor<string, []>("op_345_strides_0"), val = tensor<int32, [2]>([1, 1])];
242 tensor<int32, [4]> var_345_pad_0 = const()[name = tensor<string, []>("op_345_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
243 tensor<int32, [2]> var_345_dilations_0 = const()[name = tensor<string, []>("op_345_dilations_0"), val = tensor<int32, [2]>([1, 1])];
244 tensor<int32, []> var_345_groups_0 = const()[name = tensor<string, []>("op_345_groups_0"), val = tensor<int32, []>(1)];
245 tensor<fp16, [5120, 1280, 1, 1]> layers_0_fc1_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [819200]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(145948608))), name = tensor<string, []>("layers_0_fc1_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [50752]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(145847040))), shape = tensor<uint32, [4]>([5120, 1280, 1, 1])];
246 tensor<fp16, [1, 5120, 1, 1]> var_345_cast_fp16 = conv(dilations = var_345_dilations_0, groups = var_345_groups_0, pad = var_345_pad_0, pad_type = var_345_pad_type_0, strides = var_345_strides_0, weight = layers_0_fc1_outlier_module_weight_to_fp16_sparsified, x = input_5_cast_fp16)[name = tensor<string, []>("op_345_cast_fp16")];
247 tensor<fp16, [1, 5120, 1, 1]> input_7_cast_fp16 = add(x = var_339_cast_fp16, y = var_345_cast_fp16)[name = tensor<string, []>("input_7_cast_fp16")];
248 tensor<string, []> input_9_mode_0 = const()[name = tensor<string, []>("input_9_mode_0"), val = tensor<string, []>("EXACT")];
249 tensor<fp16, [1, 5120, 1, 1]> input_9_cast_fp16 = gelu(mode = input_9_mode_0, x = input_7_cast_fp16)[name = tensor<string, []>("input_9_cast_fp16")];
250 tensor<string, []> var_356_pad_type_0 = const()[name = tensor<string, []>("op_356_pad_type_0"), val = tensor<string, []>("valid")];
251 tensor<int32, [2]> var_356_strides_0 = const()[name = tensor<string, []>("op_356_strides_0"), val = tensor<int32, [2]>([1, 1])];
252 tensor<int32, [4]> var_356_pad_0 = const()[name = tensor<string, []>("op_356_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
253 tensor<int32, [2]> var_356_dilations_0 = const()[name = tensor<string, []>("op_356_dilations_0"), val = tensor<int32, [2]>([1, 1])];
254 tensor<int32, []> var_356_groups_0 = const()[name = tensor<string, []>("op_356_groups_0"), val = tensor<int32, []>(1)];
255 tensor<fp16, [1280, 5120, 1, 1]> layers_0_fc2_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [3276800]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(146767872))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(150044736))), name = tensor<string, []>("layers_0_fc2_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([1280, 5120, 1, 1])];
256 tensor<fp16, [1280]> layers_0_fc2_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_0_fc2_inlier_module_bias_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(150044864)))];
257 tensor<fp16, [1, 1280, 1, 1]> var_356_cast_fp16 = conv(bias = layers_0_fc2_inlier_module_bias_to_fp16, dilations = var_356_dilations_0, groups = var_356_groups_0, pad = var_356_pad_0, pad_type = var_356_pad_type_0, strides = var_356_strides_0, weight = layers_0_fc2_inlier_module_weight_to_fp16_palettized, x = input_9_cast_fp16)[name = tensor<string, []>("op_356_cast_fp16")];
258 tensor<string, []> var_362_pad_type_0 = const()[name = tensor<string, []>("op_362_pad_type_0"), val = tensor<string, []>("valid")];
259 tensor<int32, [2]> var_362_strides_0 = const()[name = tensor<string, []>("op_362_strides_0"), val = tensor<int32, [2]>([1, 1])];
260 tensor<int32, [4]> var_362_pad_0 = const()[name = tensor<string, []>("op_362_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
261 tensor<int32, [2]> var_362_dilations_0 = const()[name = tensor<string, []>("op_362_dilations_0"), val = tensor<int32, [2]>([1, 1])];
262 tensor<int32, []> var_362_groups_0 = const()[name = tensor<string, []>("op_362_groups_0"), val = tensor<int32, []>(1)];
263 tensor<fp16, [1280, 5120, 1, 1]> layers_0_fc2_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [819200]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(150230016))), name = tensor<string, []>("layers_0_fc2_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [91213]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(150047488))), shape = tensor<uint32, [4]>([1280, 5120, 1, 1])];
264 tensor<fp16, [1, 1280, 1, 1]> var_362_cast_fp16 = conv(dilations = var_362_dilations_0, groups = var_362_groups_0, pad = var_362_pad_0, pad_type = var_362_pad_type_0, strides = var_362_strides_0, weight = layers_0_fc2_outlier_module_weight_to_fp16_sparsified, x = input_9_cast_fp16)[name = tensor<string, []>("op_362_cast_fp16")];
265 tensor<fp16, [1, 1280, 1, 1]> hidden_states_3_cast_fp16 = add(x = var_356_cast_fp16, y = var_362_cast_fp16)[name = tensor<string, []>("hidden_states_3_cast_fp16")];
266 tensor<fp16, [1, 1280, 1, 1]> inputs_7_cast_fp16 = add(x = inputs_5_cast_fp16, y = hidden_states_3_cast_fp16)[name = tensor<string, []>("inputs_7_cast_fp16")];
267 tensor<int32, []> var_374 = const()[name = tensor<string, []>("op_374"), val = tensor<int32, []>(3)];
268 tensor<int32, [1]> out_7_axes_0 = const()[name = tensor<string, []>("out_7_axes_0"), val = tensor<int32, [1]>([1])];
269 tensor<fp16, []> var_400_to_fp16 = const()[name = tensor<string, []>("op_400_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
270 tensor<fp16, [1, 1280, 1, 1]> out_7_cast_fp16 = layer_norm(axes = out_7_axes_0, epsilon = var_400_to_fp16, x = inputs_7_cast_fp16)[name = tensor<string, []>("out_7_cast_fp16")];
271 tensor<fp16, [1280]> obj_15_gamma_0_to_fp16 = const()[name = tensor<string, []>("obj_15_gamma_0_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(151049280)))];
272 tensor<fp16, [1280]> obj_15_beta_0_to_fp16 = const()[name = tensor<string, []>("obj_15_beta_0_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(151051904)))];
273 tensor<fp16, []> obj_15_epsilon_0_to_fp16 = const()[name = tensor<string, []>("obj_15_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
274 tensor<fp16, [1, 1280, 1, 1]> obj_15_cast_fp16 = batch_norm(beta = obj_15_beta_0_to_fp16, epsilon = obj_15_epsilon_0_to_fp16, gamma = obj_15_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_7_cast_fp16)[name = tensor<string, []>("obj_15_cast_fp16")];
275 tensor<string, []> var_422_pad_type_0 = const()[name = tensor<string, []>("op_422_pad_type_0"), val = tensor<string, []>("valid")];
276 tensor<int32, [2]> var_422_strides_0 = const()[name = tensor<string, []>("op_422_strides_0"), val = tensor<int32, [2]>([1, 1])];
277 tensor<int32, [4]> var_422_pad_0 = const()[name = tensor<string, []>("op_422_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
278 tensor<int32, [2]> var_422_dilations_0 = const()[name = tensor<string, []>("op_422_dilations_0"), val = tensor<int32, [2]>([1, 1])];
279 tensor<int32, []> var_422_groups_0 = const()[name = tensor<string, []>("op_422_groups_0"), val = tensor<int32, []>(1)];
280 tensor<fp16, [1280, 1280, 1, 1]> layers_1_self_attn_q_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [819200]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(151054528))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(151873792))), name = tensor<string, []>("layers_1_self_attn_q_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
281 tensor<fp16, [1280]> layers_1_self_attn_q_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_1_self_attn_q_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(151873920)))];
282 tensor<fp16, [1, 1280, 1, 1]> var_422_cast_fp16 = conv(bias = layers_1_self_attn_q_proj_inlier_module_bias_to_fp16, dilations = var_422_dilations_0, groups = var_422_groups_0, pad = var_422_pad_0, pad_type = var_422_pad_type_0, strides = var_422_strides_0, weight = layers_1_self_attn_q_proj_inlier_module_weight_to_fp16_palettized, x = obj_15_cast_fp16)[name = tensor<string, []>("op_422_cast_fp16")];
283 tensor<string, []> var_428_pad_type_0 = const()[name = tensor<string, []>("op_428_pad_type_0"), val = tensor<string, []>("valid")];
284 tensor<int32, [2]> var_428_strides_0 = const()[name = tensor<string, []>("op_428_strides_0"), val = tensor<int32, [2]>([1, 1])];
285 tensor<int32, [4]> var_428_pad_0 = const()[name = tensor<string, []>("op_428_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
286 tensor<int32, [2]> var_428_dilations_0 = const()[name = tensor<string, []>("op_428_dilations_0"), val = tensor<int32, [2]>([1, 1])];
287 tensor<int32, []> var_428_groups_0 = const()[name = tensor<string, []>("op_428_groups_0"), val = tensor<int32, []>(1)];
288 tensor<fp16, [1280, 1280, 1, 1]> layers_1_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [204800]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(151936640))), name = tensor<string, []>("layers_1_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [29985]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(151876544))), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
289 tensor<fp16, [1, 1280, 1, 1]> var_428_cast_fp16 = conv(dilations = var_428_dilations_0, groups = var_428_groups_0, pad = var_428_pad_0, pad_type = var_428_pad_type_0, strides = var_428_strides_0, weight = layers_1_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified, x = obj_15_cast_fp16)[name = tensor<string, []>("op_428_cast_fp16")];
290 tensor<fp16, [1, 1280, 1, 1]> query_5_cast_fp16 = add(x = var_422_cast_fp16, y = var_428_cast_fp16)[name = tensor<string, []>("query_5_cast_fp16")];
291 tensor<string, []> var_437_pad_type_0 = const()[name = tensor<string, []>("op_437_pad_type_0"), val = tensor<string, []>("valid")];
292 tensor<int32, [2]> var_437_strides_0 = const()[name = tensor<string, []>("op_437_strides_0"), val = tensor<int32, [2]>([1, 1])];
293 tensor<int32, [4]> var_437_pad_0 = const()[name = tensor<string, []>("op_437_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
294 tensor<int32, [2]> var_437_dilations_0 = const()[name = tensor<string, []>("op_437_dilations_0"), val = tensor<int32, [2]>([1, 1])];
295 tensor<int32, []> var_437_groups_0 = const()[name = tensor<string, []>("op_437_groups_0"), val = tensor<int32, []>(1)];
296 tensor<fp16, [1280, 1280, 1, 1]> layers_1_self_attn_k_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [819200]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(152141504))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(152960768))), name = tensor<string, []>("layers_1_self_attn_k_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
297 tensor<fp16, [1, 1280, 1, 1]> var_437_cast_fp16 = conv(dilations = var_437_dilations_0, groups = var_437_groups_0, pad = var_437_pad_0, pad_type = var_437_pad_type_0, strides = var_437_strides_0, weight = layers_1_self_attn_k_proj_inlier_module_weight_to_fp16_palettized, x = obj_15_cast_fp16)[name = tensor<string, []>("op_437_cast_fp16")];
298 tensor<string, []> var_443_pad_type_0 = const()[name = tensor<string, []>("op_443_pad_type_0"), val = tensor<string, []>("valid")];
299 tensor<int32, [2]> var_443_strides_0 = const()[name = tensor<string, []>("op_443_strides_0"), val = tensor<int32, [2]>([1, 1])];
300 tensor<int32, [4]> var_443_pad_0 = const()[name = tensor<string, []>("op_443_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
301 tensor<int32, [2]> var_443_dilations_0 = const()[name = tensor<string, []>("op_443_dilations_0"), val = tensor<int32, [2]>([1, 1])];
302 tensor<int32, []> var_443_groups_0 = const()[name = tensor<string, []>("op_443_groups_0"), val = tensor<int32, []>(1)];
303 tensor<fp16, [1280, 1280, 1, 1]> layers_1_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [204800]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(153007552))), name = tensor<string, []>("layers_1_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [23287]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(152960896))), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
304 tensor<fp16, [1, 1280, 1, 1]> var_443_cast_fp16 = conv(dilations = var_443_dilations_0, groups = var_443_groups_0, pad = var_443_pad_0, pad_type = var_443_pad_type_0, strides = var_443_strides_0, weight = layers_1_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified, x = obj_15_cast_fp16)[name = tensor<string, []>("op_443_cast_fp16")];
305 tensor<fp16, [1, 1280, 1, 1]> current_key_3_cast_fp16 = add(x = var_437_cast_fp16, y = var_443_cast_fp16)[name = tensor<string, []>("current_key_3_cast_fp16")];
306 tensor<string, []> var_453_pad_type_0 = const()[name = tensor<string, []>("op_453_pad_type_0"), val = tensor<string, []>("valid")];
307 tensor<int32, [2]> var_453_strides_0 = const()[name = tensor<string, []>("op_453_strides_0"), val = tensor<int32, [2]>([1, 1])];
308 tensor<int32, [4]> var_453_pad_0 = const()[name = tensor<string, []>("op_453_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
309 tensor<int32, [2]> var_453_dilations_0 = const()[name = tensor<string, []>("op_453_dilations_0"), val = tensor<int32, [2]>([1, 1])];
310 tensor<int32, []> var_453_groups_0 = const()[name = tensor<string, []>("op_453_groups_0"), val = tensor<int32, []>(1)];
311 tensor<fp16, [1280, 1280, 1, 1]> layers_1_self_attn_v_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [819200]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(153212416))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(154031680))), name = tensor<string, []>("layers_1_self_attn_v_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
312 tensor<fp16, [1280]> layers_1_self_attn_v_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_1_self_attn_v_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(154031808)))];
313 tensor<fp16, [1, 1280, 1, 1]> var_453_cast_fp16 = conv(bias = layers_1_self_attn_v_proj_inlier_module_bias_to_fp16, dilations = var_453_dilations_0, groups = var_453_groups_0, pad = var_453_pad_0, pad_type = var_453_pad_type_0, strides = var_453_strides_0, weight = layers_1_self_attn_v_proj_inlier_module_weight_to_fp16_palettized, x = obj_15_cast_fp16)[name = tensor<string, []>("op_453_cast_fp16")];
314 tensor<string, []> var_459_pad_type_0 = const()[name = tensor<string, []>("op_459_pad_type_0"), val = tensor<string, []>("valid")];
315 tensor<int32, [2]> var_459_strides_0 = const()[name = tensor<string, []>("op_459_strides_0"), val = tensor<int32, [2]>([1, 1])];
316 tensor<int32, [4]> var_459_pad_0 = const()[name = tensor<string, []>("op_459_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
317 tensor<int32, [2]> var_459_dilations_0 = const()[name = tensor<string, []>("op_459_dilations_0"), val = tensor<int32, [2]>([1, 1])];
318 tensor<int32, []> var_459_groups_0 = const()[name = tensor<string, []>("op_459_groups_0"), val = tensor<int32, []>(1)];
319 tensor<fp16, [1280, 1280, 1, 1]> layers_1_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [204800]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(154057088))), name = tensor<string, []>("layers_1_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [11267]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(154034432))), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
320 tensor<fp16, [1, 1280, 1, 1]> var_459_cast_fp16 = conv(dilations = var_459_dilations_0, groups = var_459_groups_0, pad = var_459_pad_0, pad_type = var_459_pad_type_0, strides = var_459_strides_0, weight = layers_1_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified, x = obj_15_cast_fp16)[name = tensor<string, []>("op_459_cast_fp16")];
321 tensor<fp16, [1, 1280, 1, 1]> current_value_3_cast_fp16 = add(x = var_453_cast_fp16, y = var_459_cast_fp16)[name = tensor<string, []>("current_value_3_cast_fp16")];
322 tensor<fp16, [1, 1280, 1, 224]> var_465_cast_fp16 = mul(x = current_key_3_cast_fp16, y = var_159_cast_fp16)[name = tensor<string, []>("op_465_cast_fp16")];
323 tensor<fp16, [1, 1280, 1, 224]> var_467_cast_fp16 = mul(x = var_53_cast_fp16_1, y = var_162_cast_fp16)[name = tensor<string, []>("op_467_cast_fp16")];
324 tensor<fp16, [1, 1280, 1, 224]> key_5_cast_fp16 = add(x = var_465_cast_fp16, y = var_467_cast_fp16)[name = tensor<string, []>("key_5_cast_fp16")];
325 tensor<fp16, [1, 1280, 1, 224]> var_469_cast_fp16 = mul(x = current_value_3_cast_fp16, y = var_159_cast_fp16)[name = tensor<string, []>("op_469_cast_fp16")];
326 tensor<fp16, [1, 1280, 1, 224]> var_471_cast_fp16 = mul(x = var_60_cast_fp16_1, y = var_162_cast_fp16)[name = tensor<string, []>("op_471_cast_fp16")];
327 tensor<fp16, [1, 1280, 1, 224]> value_5_cast_fp16 = add(x = var_469_cast_fp16, y = var_471_cast_fp16)[name = tensor<string, []>("value_5_cast_fp16")];
328 tensor<int32, [4]> var_474 = const()[name = tensor<string, []>("op_474"), val = tensor<int32, [4]>([1, 20, 64, -1])];
329 tensor<fp16, [1, 20, 64, 1]> mh_q_5_cast_fp16 = reshape(shape = var_474, x = query_5_cast_fp16)[name = tensor<string, []>("mh_q_5_cast_fp16")];
330 tensor<fp16, []> var_476_to_fp16 = const()[name = tensor<string, []>("op_476_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
331 tensor<fp16, [1, 20, 64, 1]> var_477_cast_fp16 = mul(x = mh_q_5_cast_fp16, y = var_476_to_fp16)[name = tensor<string, []>("op_477_cast_fp16")];
332 tensor<int32, [4]> var_478 = const()[name = tensor<string, []>("op_478"), val = tensor<int32, [4]>([1, 20, 64, -1])];
333 tensor<fp16, [1, 20, 64, 224]> var_479_cast_fp16 = reshape(shape = var_478, x = key_5_cast_fp16)[name = tensor<string, []>("op_479_cast_fp16")];
334 tensor<bool, []> mh_w_7_transpose_x_0 = const()[name = tensor<string, []>("mh_w_7_transpose_x_0"), val = tensor<bool, []>(true)];
335 tensor<bool, []> mh_w_7_transpose_y_0 = const()[name = tensor<string, []>("mh_w_7_transpose_y_0"), val = tensor<bool, []>(false)];
336 tensor<fp16, [1, 20, 1, 224]> mh_w_7_cast_fp16 = matmul(transpose_x = mh_w_7_transpose_x_0, transpose_y = mh_w_7_transpose_y_0, x = var_477_cast_fp16, y = var_479_cast_fp16)[name = tensor<string, []>("mh_w_7_cast_fp16")];
337 tensor<fp16, [1, 20, 1, 224]> mh_w_9_cast_fp16 = add(x = mh_w_7_cast_fp16, y = var_180_cast_fp16)[name = tensor<string, []>("mh_w_9_cast_fp16")];
338 tensor<fp16, [1, 20, 1, 224]> var_487_cast_fp16 = softmax(axis = var_374, x = mh_w_9_cast_fp16)[name = tensor<string, []>("op_487_cast_fp16")];
339 tensor<int32, [4]> var_488 = const()[name = tensor<string, []>("op_488"), val = tensor<int32, [4]>([1, 20, 64, -1])];
340 tensor<fp16, [1, 20, 64, 224]> var_489_cast_fp16 = reshape(shape = var_488, x = value_5_cast_fp16)[name = tensor<string, []>("op_489_cast_fp16")];
341 tensor<bool, []> attn_5_transpose_x_0 = const()[name = tensor<string, []>("attn_5_transpose_x_0"), val = tensor<bool, []>(false)];
342 tensor<bool, []> attn_5_transpose_y_0 = const()[name = tensor<string, []>("attn_5_transpose_y_0"), val = tensor<bool, []>(true)];
343 tensor<fp16, [1, 20, 64, 1]> attn_5_cast_fp16 = matmul(transpose_x = attn_5_transpose_x_0, transpose_y = attn_5_transpose_y_0, x = var_489_cast_fp16, y = var_487_cast_fp16)[name = tensor<string, []>("attn_5_cast_fp16")];
344 tensor<int32, [4]> var_492 = const()[name = tensor<string, []>("op_492"), val = tensor<int32, [4]>([1, 1280, 1, -1])];
345 tensor<fp16, [1, 1280, 1, 1]> input_11_cast_fp16 = reshape(shape = var_492, x = attn_5_cast_fp16)[name = tensor<string, []>("input_11_cast_fp16")];
346 tensor<string, []> var_502_pad_type_0 = const()[name = tensor<string, []>("op_502_pad_type_0"), val = tensor<string, []>("valid")];
347 tensor<int32, [2]> var_502_strides_0 = const()[name = tensor<string, []>("op_502_strides_0"), val = tensor<int32, [2]>([1, 1])];
348 tensor<int32, [4]> var_502_pad_0 = const()[name = tensor<string, []>("op_502_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
349 tensor<int32, [2]> var_502_dilations_0 = const()[name = tensor<string, []>("op_502_dilations_0"), val = tensor<int32, [2]>([1, 1])];
350 tensor<int32, []> var_502_groups_0 = const()[name = tensor<string, []>("op_502_groups_0"), val = tensor<int32, []>(1)];
351 tensor<fp16, [1280, 1280, 1, 1]> layers_1_self_attn_o_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [819200]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(154261952))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(155081216))), name = tensor<string, []>("layers_1_self_attn_o_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
352 tensor<fp16, [1280]> layers_1_self_attn_o_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_1_self_attn_o_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(155081344)))];
353 tensor<fp16, [1, 1280, 1, 1]> var_502_cast_fp16 = conv(bias = layers_1_self_attn_o_proj_inlier_module_bias_to_fp16, dilations = var_502_dilations_0, groups = var_502_groups_0, pad = var_502_pad_0, pad_type = var_502_pad_type_0, strides = var_502_strides_0, weight = layers_1_self_attn_o_proj_inlier_module_weight_to_fp16_palettized, x = input_11_cast_fp16)[name = tensor<string, []>("op_502_cast_fp16")];
354 tensor<string, []> var_508_pad_type_0 = const()[name = tensor<string, []>("op_508_pad_type_0"), val = tensor<string, []>("valid")];
355 tensor<int32, [2]> var_508_strides_0 = const()[name = tensor<string, []>("op_508_strides_0"), val = tensor<int32, [2]>([1, 1])];
356 tensor<int32, [4]> var_508_pad_0 = const()[name = tensor<string, []>("op_508_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
357 tensor<int32, [2]> var_508_dilations_0 = const()[name = tensor<string, []>("op_508_dilations_0"), val = tensor<int32, [2]>([1, 1])];
358 tensor<int32, []> var_508_groups_0 = const()[name = tensor<string, []>("op_508_groups_0"), val = tensor<int32, []>(1)];
359 tensor<fp16, [1280, 1280, 1, 1]> layers_1_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [204800]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(155108416))), name = tensor<string, []>("layers_1_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [12187]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(155083968))), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
360 tensor<fp16, [1, 1280, 1, 1]> var_508_cast_fp16 = conv(dilations = var_508_dilations_0, groups = var_508_groups_0, pad = var_508_pad_0, pad_type = var_508_pad_type_0, strides = var_508_strides_0, weight = layers_1_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified, x = input_11_cast_fp16)[name = tensor<string, []>("op_508_cast_fp16")];
361 tensor<fp16, [1, 1280, 1, 1]> obj_21_cast_fp16 = add(x = var_502_cast_fp16, y = var_508_cast_fp16)[name = tensor<string, []>("obj_21_cast_fp16")];
362 tensor<fp16, [1, 1280, 1, 1]> inputs_9_cast_fp16 = add(x = inputs_7_cast_fp16, y = obj_21_cast_fp16)[name = tensor<string, []>("inputs_9_cast_fp16")];
363 tensor<int32, [1]> out_9_axes_0 = const()[name = tensor<string, []>("out_9_axes_0"), val = tensor<int32, [1]>([1])];
364 tensor<fp16, []> var_523_to_fp16 = const()[name = tensor<string, []>("op_523_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
365 tensor<fp16, [1, 1280, 1, 1]> out_9_cast_fp16 = layer_norm(axes = out_9_axes_0, epsilon = var_523_to_fp16, x = inputs_9_cast_fp16)[name = tensor<string, []>("out_9_cast_fp16")];
366 tensor<fp16, [1280]> obj_23_gamma_0_to_fp16 = const()[name = tensor<string, []>("obj_23_gamma_0_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(155313280)))];
367 tensor<fp16, [1280]> obj_23_beta_0_to_fp16 = const()[name = tensor<string, []>("obj_23_beta_0_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(155315904)))];
368 tensor<fp16, []> obj_23_epsilon_0_to_fp16 = const()[name = tensor<string, []>("obj_23_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
369 tensor<fp16, [1, 1280, 1, 1]> obj_23_cast_fp16 = batch_norm(beta = obj_23_beta_0_to_fp16, epsilon = obj_23_epsilon_0_to_fp16, gamma = obj_23_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_9_cast_fp16)[name = tensor<string, []>("obj_23_cast_fp16")];
370 tensor<string, []> var_545_pad_type_0 = const()[name = tensor<string, []>("op_545_pad_type_0"), val = tensor<string, []>("valid")];
371 tensor<int32, [2]> var_545_strides_0 = const()[name = tensor<string, []>("op_545_strides_0"), val = tensor<int32, [2]>([1, 1])];
372 tensor<int32, [4]> var_545_pad_0 = const()[name = tensor<string, []>("op_545_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
373 tensor<int32, [2]> var_545_dilations_0 = const()[name = tensor<string, []>("op_545_dilations_0"), val = tensor<int32, [2]>([1, 1])];
374 tensor<int32, []> var_545_groups_0 = const()[name = tensor<string, []>("op_545_groups_0"), val = tensor<int32, []>(1)];
375 tensor<fp16, [1280, 1280, 1, 1]> layers_1_encoder_attn_q_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [819200]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(155318528))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(156137792))), name = tensor<string, []>("layers_1_encoder_attn_q_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
376 tensor<fp16, [1280]> layers_1_encoder_attn_q_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_1_encoder_attn_q_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(156137920)))];
377 tensor<fp16, [1, 1280, 1, 1]> var_545_cast_fp16 = conv(bias = layers_1_encoder_attn_q_proj_inlier_module_bias_to_fp16, dilations = var_545_dilations_0, groups = var_545_groups_0, pad = var_545_pad_0, pad_type = var_545_pad_type_0, strides = var_545_strides_0, weight = layers_1_encoder_attn_q_proj_inlier_module_weight_to_fp16_palettized, x = obj_23_cast_fp16)[name = tensor<string, []>("op_545_cast_fp16")];
378 tensor<string, []> var_551_pad_type_0 = const()[name = tensor<string, []>("op_551_pad_type_0"), val = tensor<string, []>("valid")];
379 tensor<int32, [2]> var_551_strides_0 = const()[name = tensor<string, []>("op_551_strides_0"), val = tensor<int32, [2]>([1, 1])];
380 tensor<int32, [4]> var_551_pad_0 = const()[name = tensor<string, []>("op_551_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
381 tensor<int32, [2]> var_551_dilations_0 = const()[name = tensor<string, []>("op_551_dilations_0"), val = tensor<int32, [2]>([1, 1])];
382 tensor<int32, []> var_551_groups_0 = const()[name = tensor<string, []>("op_551_groups_0"), val = tensor<int32, []>(1)];
383 tensor<fp16, [1280, 1280, 1, 1]> layers_1_encoder_attn_q_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [204800]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(156183616))), name = tensor<string, []>("layers_1_encoder_attn_q_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [21483]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(156140544))), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
384 tensor<fp16, [1, 1280, 1, 1]> var_551_cast_fp16 = conv(dilations = var_551_dilations_0, groups = var_551_groups_0, pad = var_551_pad_0, pad_type = var_551_pad_type_0, strides = var_551_strides_0, weight = layers_1_encoder_attn_q_proj_outlier_module_weight_to_fp16_sparsified, x = obj_23_cast_fp16)[name = tensor<string, []>("op_551_cast_fp16")];
385 tensor<fp16, [1, 1280, 1, 1]> query_7_cast_fp16 = add(x = var_545_cast_fp16, y = var_551_cast_fp16)[name = tensor<string, []>("query_7_cast_fp16")];
386 tensor<string, []> var_560_pad_type_0 = const()[name = tensor<string, []>("op_560_pad_type_0"), val = tensor<string, []>("valid")];
387 tensor<int32, [2]> var_560_strides_0 = const()[name = tensor<string, []>("op_560_strides_0"), val = tensor<int32, [2]>([1, 1])];
388 tensor<int32, [4]> var_560_pad_0 = const()[name = tensor<string, []>("op_560_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
389 tensor<int32, [2]> var_560_dilations_0 = const()[name = tensor<string, []>("op_560_dilations_0"), val = tensor<int32, [2]>([1, 1])];
390 tensor<int32, []> var_560_groups_0 = const()[name = tensor<string, []>("op_560_groups_0"), val = tensor<int32, []>(1)];
391 tensor<fp16, [1280, 1280, 1, 1]> layers_1_encoder_attn_k_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [819200]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(156388480))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(157207744))), name = tensor<string, []>("layers_1_encoder_attn_k_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
392 tensor<fp16, [1, 1280, 1, 1500]> var_560_cast_fp16 = conv(dilations = var_560_dilations_0, groups = var_560_groups_0, pad = var_560_pad_0, pad_type = var_560_pad_type_0, strides = var_560_strides_0, weight = layers_1_encoder_attn_k_proj_inlier_module_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor<string, []>("op_560_cast_fp16")];
393 tensor<string, []> var_566_pad_type_0 = const()[name = tensor<string, []>("op_566_pad_type_0"), val = tensor<string, []>("valid")];
394 tensor<int32, [2]> var_566_strides_0 = const()[name = tensor<string, []>("op_566_strides_0"), val = tensor<int32, [2]>([1, 1])];
395 tensor<int32, [4]> var_566_pad_0 = const()[name = tensor<string, []>("op_566_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
396 tensor<int32, [2]> var_566_dilations_0 = const()[name = tensor<string, []>("op_566_dilations_0"), val = tensor<int32, [2]>([1, 1])];
397 tensor<int32, []> var_566_groups_0 = const()[name = tensor<string, []>("op_566_groups_0"), val = tensor<int32, []>(1)];
398 tensor<fp16, [1280, 1280, 1, 1]> layers_1_encoder_attn_k_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [204800]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(157251328))), name = tensor<string, []>("layers_1_encoder_attn_k_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [21667]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(157207872))), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
399 tensor<fp16, [1, 1280, 1, 1500]> var_566_cast_fp16 = conv(dilations = var_566_dilations_0, groups = var_566_groups_0, pad = var_566_pad_0, pad_type = var_566_pad_type_0, strides = var_566_strides_0, weight = layers_1_encoder_attn_k_proj_outlier_module_weight_to_fp16_sparsified, x = encoder_output_embeds)[name = tensor<string, []>("op_566_cast_fp16")];
400 tensor<fp16, [1, 1280, 1, 1500]> key_7_cast_fp16 = add(x = var_560_cast_fp16, y = var_566_cast_fp16)[name = tensor<string, []>("key_7_cast_fp16")];
401 tensor<string, []> var_576_pad_type_0 = const()[name = tensor<string, []>("op_576_pad_type_0"), val = tensor<string, []>("valid")];
402 tensor<int32, [2]> var_576_strides_0 = const()[name = tensor<string, []>("op_576_strides_0"), val = tensor<int32, [2]>([1, 1])];
403 tensor<int32, [4]> var_576_pad_0 = const()[name = tensor<string, []>("op_576_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
404 tensor<int32, [2]> var_576_dilations_0 = const()[name = tensor<string, []>("op_576_dilations_0"), val = tensor<int32, [2]>([1, 1])];
405 tensor<int32, []> var_576_groups_0 = const()[name = tensor<string, []>("op_576_groups_0"), val = tensor<int32, []>(1)];
406 tensor<fp16, [1280, 1280, 1, 1]> layers_1_encoder_attn_v_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [819200]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(157456192))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(158275456))), name = tensor<string, []>("layers_1_encoder_attn_v_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
407 tensor<fp16, [1280]> layers_1_encoder_attn_v_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_1_encoder_attn_v_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(158275584)))];
408 tensor<fp16, [1, 1280, 1, 1500]> var_576_cast_fp16 = conv(bias = layers_1_encoder_attn_v_proj_inlier_module_bias_to_fp16, dilations = var_576_dilations_0, groups = var_576_groups_0, pad = var_576_pad_0, pad_type = var_576_pad_type_0, strides = var_576_strides_0, weight = layers_1_encoder_attn_v_proj_inlier_module_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor<string, []>("op_576_cast_fp16")];
409 tensor<string, []> var_582_pad_type_0 = const()[name = tensor<string, []>("op_582_pad_type_0"), val = tensor<string, []>("valid")];
410 tensor<int32, [2]> var_582_strides_0 = const()[name = tensor<string, []>("op_582_strides_0"), val = tensor<int32, [2]>([1, 1])];
411 tensor<int32, [4]> var_582_pad_0 = const()[name = tensor<string, []>("op_582_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
412 tensor<int32, [2]> var_582_dilations_0 = const()[name = tensor<string, []>("op_582_dilations_0"), val = tensor<int32, [2]>([1, 1])];
413 tensor<int32, []> var_582_groups_0 = const()[name = tensor<string, []>("op_582_groups_0"), val = tensor<int32, []>(1)];
414 tensor<fp16, [1280, 1280, 1, 1]> layers_1_encoder_attn_v_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [204800]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(158289408))), name = tensor<string, []>("layers_1_encoder_attn_v_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [5557]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(158278208))), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
415 tensor<fp16, [1, 1280, 1, 1500]> var_582_cast_fp16 = conv(dilations = var_582_dilations_0, groups = var_582_groups_0, pad = var_582_pad_0, pad_type = var_582_pad_type_0, strides = var_582_strides_0, weight = layers_1_encoder_attn_v_proj_outlier_module_weight_to_fp16_sparsified, x = encoder_output_embeds)[name = tensor<string, []>("op_582_cast_fp16")];
416 tensor<fp16, [1, 1280, 1, 1500]> value_7_cast_fp16 = add(x = var_576_cast_fp16, y = var_582_cast_fp16)[name = tensor<string, []>("value_7_cast_fp16")];
417 tensor<int32, [4]> var_585 = const()[name = tensor<string, []>("op_585"), val = tensor<int32, [4]>([1, 20, 64, -1])];
418 tensor<fp16, [1, 20, 64, 1]> mh_q_7_cast_fp16 = reshape(shape = var_585, x = query_7_cast_fp16)[name = tensor<string, []>("mh_q_7_cast_fp16")];
419 tensor<fp16, []> var_587_to_fp16 = const()[name = tensor<string, []>("op_587_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
420 tensor<fp16, [1, 20, 64, 1]> var_588_cast_fp16 = mul(x = mh_q_7_cast_fp16, y = var_587_to_fp16)[name = tensor<string, []>("op_588_cast_fp16")];
421 tensor<int32, [4]> var_589 = const()[name = tensor<string, []>("op_589"), val = tensor<int32, [4]>([1, 20, 64, -1])];
422 tensor<fp16, [1, 20, 64, 1500]> var_590_cast_fp16 = reshape(shape = var_589, x = key_7_cast_fp16)[name = tensor<string, []>("op_590_cast_fp16")];
423 tensor<bool, []> mh_w_11_transpose_x_0 = const()[name = tensor<string, []>("mh_w_11_transpose_x_0"), val = tensor<bool, []>(true)];
424 tensor<bool, []> mh_w_11_transpose_y_0 = const()[name = tensor<string, []>("mh_w_11_transpose_y_0"), val = tensor<bool, []>(false)];
425 tensor<fp16, [1, 20, 1, 1500]> mh_w_11_cast_fp16 = matmul(transpose_x = mh_w_11_transpose_x_0, transpose_y = mh_w_11_transpose_y_0, x = var_588_cast_fp16, y = var_590_cast_fp16)[name = tensor<string, []>("mh_w_11_cast_fp16")];
426 tensor<fp16, [1, 20, 1, 1500]> obj_27_cast_fp16 = softmax(axis = var_374, x = mh_w_11_cast_fp16)[name = tensor<string, []>("obj_27_cast_fp16")];
427 tensor<int32, [4]> var_594 = const()[name = tensor<string, []>("op_594"), val = tensor<int32, [4]>([1, 20, 64, -1])];
428 tensor<fp16, [1, 20, 64, 1500]> var_595_cast_fp16 = reshape(shape = var_594, x = value_7_cast_fp16)[name = tensor<string, []>("op_595_cast_fp16")];
429 tensor<bool, []> attn_7_transpose_x_0 = const()[name = tensor<string, []>("attn_7_transpose_x_0"), val = tensor<bool, []>(false)];
430 tensor<bool, []> attn_7_transpose_y_0 = const()[name = tensor<string, []>("attn_7_transpose_y_0"), val = tensor<bool, []>(true)];
431 tensor<fp16, [1, 20, 64, 1]> attn_7_cast_fp16 = matmul(transpose_x = attn_7_transpose_x_0, transpose_y = attn_7_transpose_y_0, x = var_595_cast_fp16, y = obj_27_cast_fp16)[name = tensor<string, []>("attn_7_cast_fp16")];
432 tensor<int32, [4]> var_598 = const()[name = tensor<string, []>("op_598"), val = tensor<int32, [4]>([1, 1280, 1, -1])];
433 tensor<fp16, [1, 1280, 1, 1]> input_13_cast_fp16 = reshape(shape = var_598, x = attn_7_cast_fp16)[name = tensor<string, []>("input_13_cast_fp16")];
434 tensor<string, []> var_608_pad_type_0 = const()[name = tensor<string, []>("op_608_pad_type_0"), val = tensor<string, []>("valid")];
435 tensor<int32, [2]> var_608_strides_0 = const()[name = tensor<string, []>("op_608_strides_0"), val = tensor<int32, [2]>([1, 1])];
436 tensor<int32, [4]> var_608_pad_0 = const()[name = tensor<string, []>("op_608_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
437 tensor<int32, [2]> var_608_dilations_0 = const()[name = tensor<string, []>("op_608_dilations_0"), val = tensor<int32, [2]>([1, 1])];
438 tensor<int32, []> var_608_groups_0 = const()[name = tensor<string, []>("op_608_groups_0"), val = tensor<int32, []>(1)];
439 tensor<fp16, [1280, 1280, 1, 1]> layers_1_encoder_attn_o_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [819200]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(158494272))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(159313536))), name = tensor<string, []>("layers_1_encoder_attn_o_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
440 tensor<fp16, [1280]> layers_1_encoder_attn_o_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_1_encoder_attn_o_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(159313664)))];
441 tensor<fp16, [1, 1280, 1, 1]> var_608_cast_fp16 = conv(bias = layers_1_encoder_attn_o_proj_inlier_module_bias_to_fp16, dilations = var_608_dilations_0, groups = var_608_groups_0, pad = var_608_pad_0, pad_type = var_608_pad_type_0, strides = var_608_strides_0, weight = layers_1_encoder_attn_o_proj_inlier_module_weight_to_fp16_palettized, x = input_13_cast_fp16)[name = tensor<string, []>("op_608_cast_fp16")];
442 tensor<string, []> var_614_pad_type_0 = const()[name = tensor<string, []>("op_614_pad_type_0"), val = tensor<string, []>("valid")];
443 tensor<int32, [2]> var_614_strides_0 = const()[name = tensor<string, []>("op_614_strides_0"), val = tensor<int32, [2]>([1, 1])];
444 tensor<int32, [4]> var_614_pad_0 = const()[name = tensor<string, []>("op_614_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
445 tensor<int32, [2]> var_614_dilations_0 = const()[name = tensor<string, []>("op_614_dilations_0"), val = tensor<int32, [2]>([1, 1])];
446 tensor<int32, []> var_614_groups_0 = const()[name = tensor<string, []>("op_614_groups_0"), val = tensor<int32, []>(1)];
447 tensor<fp16, [1280, 1280, 1, 1]> layers_1_encoder_attn_o_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [204800]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(159326656))), name = tensor<string, []>("layers_1_encoder_attn_o_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [5143]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(159316288))), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
448 tensor<fp16, [1, 1280, 1, 1]> var_614_cast_fp16 = conv(dilations = var_614_dilations_0, groups = var_614_groups_0, pad = var_614_pad_0, pad_type = var_614_pad_type_0, strides = var_614_strides_0, weight = layers_1_encoder_attn_o_proj_outlier_module_weight_to_fp16_sparsified, x = input_13_cast_fp16)[name = tensor<string, []>("op_614_cast_fp16")];
449 tensor<fp16, [1, 1280, 1, 1]> obj_25_cast_fp16 = add(x = var_608_cast_fp16, y = var_614_cast_fp16)[name = tensor<string, []>("obj_25_cast_fp16")];
450 tensor<fp16, [1, 1280, 1, 1]> inputs_11_cast_fp16 = add(x = inputs_9_cast_fp16, y = obj_25_cast_fp16)[name = tensor<string, []>("inputs_11_cast_fp16")];
451 tensor<int32, [1]> out_11_axes_0 = const()[name = tensor<string, []>("out_11_axes_0"), val = tensor<int32, [1]>([1])];
452 tensor<fp16, []> var_625_to_fp16 = const()[name = tensor<string, []>("op_625_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
453 tensor<fp16, [1, 1280, 1, 1]> out_11_cast_fp16 = layer_norm(axes = out_11_axes_0, epsilon = var_625_to_fp16, x = inputs_11_cast_fp16)[name = tensor<string, []>("out_11_cast_fp16")];
454 tensor<fp16, [1280]> input_15_gamma_0_to_fp16 = const()[name = tensor<string, []>("input_15_gamma_0_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(159531520)))];
455 tensor<fp16, [1280]> input_15_beta_0_to_fp16 = const()[name = tensor<string, []>("input_15_beta_0_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(159534144)))];
456 tensor<fp16, []> input_15_epsilon_0_to_fp16 = const()[name = tensor<string, []>("input_15_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
457 tensor<fp16, [1, 1280, 1, 1]> input_15_cast_fp16 = batch_norm(beta = input_15_beta_0_to_fp16, epsilon = input_15_epsilon_0_to_fp16, gamma = input_15_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_11_cast_fp16)[name = tensor<string, []>("input_15_cast_fp16")];
458 tensor<string, []> var_643_pad_type_0 = const()[name = tensor<string, []>("op_643_pad_type_0"), val = tensor<string, []>("valid")];
459 tensor<int32, [2]> var_643_strides_0 = const()[name = tensor<string, []>("op_643_strides_0"), val = tensor<int32, [2]>([1, 1])];
460 tensor<int32, [4]> var_643_pad_0 = const()[name = tensor<string, []>("op_643_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
461 tensor<int32, [2]> var_643_dilations_0 = const()[name = tensor<string, []>("op_643_dilations_0"), val = tensor<int32, [2]>([1, 1])];
462 tensor<int32, []> var_643_groups_0 = const()[name = tensor<string, []>("op_643_groups_0"), val = tensor<int32, []>(1)];
463 tensor<fp16, [5120, 1280, 1, 1]> layers_1_fc1_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [3276800]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(159536768))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(162813632))), name = tensor<string, []>("layers_1_fc1_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([5120, 1280, 1, 1])];
464 tensor<fp16, [5120]> layers_1_fc1_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_1_fc1_inlier_module_bias_to_fp16"), val = tensor<fp16, [5120]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(162813760)))];
465 tensor<fp16, [1, 5120, 1, 1]> var_643_cast_fp16 = conv(bias = layers_1_fc1_inlier_module_bias_to_fp16, dilations = var_643_dilations_0, groups = var_643_groups_0, pad = var_643_pad_0, pad_type = var_643_pad_type_0, strides = var_643_strides_0, weight = layers_1_fc1_inlier_module_weight_to_fp16_palettized, x = input_15_cast_fp16)[name = tensor<string, []>("op_643_cast_fp16")];
466 tensor<string, []> var_649_pad_type_0 = const()[name = tensor<string, []>("op_649_pad_type_0"), val = tensor<string, []>("valid")];
467 tensor<int32, [2]> var_649_strides_0 = const()[name = tensor<string, []>("op_649_strides_0"), val = tensor<int32, [2]>([1, 1])];
468 tensor<int32, [4]> var_649_pad_0 = const()[name = tensor<string, []>("op_649_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
469 tensor<int32, [2]> var_649_dilations_0 = const()[name = tensor<string, []>("op_649_dilations_0"), val = tensor<int32, [2]>([1, 1])];
470 tensor<int32, []> var_649_groups_0 = const()[name = tensor<string, []>("op_649_groups_0"), val = tensor<int32, []>(1)];
471 tensor<fp16, [5120, 1280, 1, 1]> layers_1_fc1_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [819200]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(162909312))), name = tensor<string, []>("layers_1_fc1_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [42562]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(162824064))), shape = tensor<uint32, [4]>([5120, 1280, 1, 1])];
472 tensor<fp16, [1, 5120, 1, 1]> var_649_cast_fp16 = conv(dilations = var_649_dilations_0, groups = var_649_groups_0, pad = var_649_pad_0, pad_type = var_649_pad_type_0, strides = var_649_strides_0, weight = layers_1_fc1_outlier_module_weight_to_fp16_sparsified, x = input_15_cast_fp16)[name = tensor<string, []>("op_649_cast_fp16")];
473 tensor<fp16, [1, 5120, 1, 1]> input_17_cast_fp16 = add(x = var_643_cast_fp16, y = var_649_cast_fp16)[name = tensor<string, []>("input_17_cast_fp16")];
474 tensor<string, []> input_19_mode_0 = const()[name = tensor<string, []>("input_19_mode_0"), val = tensor<string, []>("EXACT")];
475 tensor<fp16, [1, 5120, 1, 1]> input_19_cast_fp16 = gelu(mode = input_19_mode_0, x = input_17_cast_fp16)[name = tensor<string, []>("input_19_cast_fp16")];
476 tensor<string, []> var_660_pad_type_0 = const()[name = tensor<string, []>("op_660_pad_type_0"), val = tensor<string, []>("valid")];
477 tensor<int32, [2]> var_660_strides_0 = const()[name = tensor<string, []>("op_660_strides_0"), val = tensor<int32, [2]>([1, 1])];
478 tensor<int32, [4]> var_660_pad_0 = const()[name = tensor<string, []>("op_660_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
479 tensor<int32, [2]> var_660_dilations_0 = const()[name = tensor<string, []>("op_660_dilations_0"), val = tensor<int32, [2]>([1, 1])];
480 tensor<int32, []> var_660_groups_0 = const()[name = tensor<string, []>("op_660_groups_0"), val = tensor<int32, []>(1)];
481 tensor<fp16, [1280, 5120, 1, 1]> layers_1_fc2_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [3276800]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(163728576))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(167005440))), name = tensor<string, []>("layers_1_fc2_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([1280, 5120, 1, 1])];
482 tensor<fp16, [1280]> layers_1_fc2_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_1_fc2_inlier_module_bias_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(167005568)))];
483 tensor<fp16, [1, 1280, 1, 1]> var_660_cast_fp16 = conv(bias = layers_1_fc2_inlier_module_bias_to_fp16, dilations = var_660_dilations_0, groups = var_660_groups_0, pad = var_660_pad_0, pad_type = var_660_pad_type_0, strides = var_660_strides_0, weight = layers_1_fc2_inlier_module_weight_to_fp16_palettized, x = input_19_cast_fp16)[name = tensor<string, []>("op_660_cast_fp16")];
484 tensor<string, []> var_666_pad_type_0 = const()[name = tensor<string, []>("op_666_pad_type_0"), val = tensor<string, []>("valid")];
485 tensor<int32, [2]> var_666_strides_0 = const()[name = tensor<string, []>("op_666_strides_0"), val = tensor<int32, [2]>([1, 1])];
486 tensor<int32, [4]> var_666_pad_0 = const()[name = tensor<string, []>("op_666_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
487 tensor<int32, [2]> var_666_dilations_0 = const()[name = tensor<string, []>("op_666_dilations_0"), val = tensor<int32, [2]>([1, 1])];
488 tensor<int32, []> var_666_groups_0 = const()[name = tensor<string, []>("op_666_groups_0"), val = tensor<int32, []>(1)];
489 tensor<fp16, [1280, 5120, 1, 1]> layers_1_fc2_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [819200]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(167096192))), name = tensor<string, []>("layers_1_fc2_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [43939]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(167008192))), shape = tensor<uint32, [4]>([1280, 5120, 1, 1])];
490 tensor<fp16, [1, 1280, 1, 1]> var_666_cast_fp16 = conv(dilations = var_666_dilations_0, groups = var_666_groups_0, pad = var_666_pad_0, pad_type = var_666_pad_type_0, strides = var_666_strides_0, weight = layers_1_fc2_outlier_module_weight_to_fp16_sparsified, x = input_19_cast_fp16)[name = tensor<string, []>("op_666_cast_fp16")];
491 tensor<fp16, [1, 1280, 1, 1]> hidden_states_5_cast_fp16 = add(x = var_660_cast_fp16, y = var_666_cast_fp16)[name = tensor<string, []>("hidden_states_5_cast_fp16")];
492 tensor<fp16, [1, 1280, 1, 1]> inputs_13_cast_fp16 = add(x = inputs_11_cast_fp16, y = hidden_states_5_cast_fp16)[name = tensor<string, []>("inputs_13_cast_fp16")];
493 tensor<int32, []> var_678 = const()[name = tensor<string, []>("op_678"), val = tensor<int32, []>(3)];
494 tensor<int32, [1]> out_13_axes_0 = const()[name = tensor<string, []>("out_13_axes_0"), val = tensor<int32, [1]>([1])];
495 tensor<fp16, []> var_704_to_fp16 = const()[name = tensor<string, []>("op_704_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
496 tensor<fp16, [1, 1280, 1, 1]> out_13_cast_fp16 = layer_norm(axes = out_13_axes_0, epsilon = var_704_to_fp16, x = inputs_13_cast_fp16)[name = tensor<string, []>("out_13_cast_fp16")];
497 tensor<fp16, [1280]> obj_29_gamma_0_to_fp16 = const()[name = tensor<string, []>("obj_29_gamma_0_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(167915456)))];
498 tensor<fp16, [1280]> obj_29_beta_0_to_fp16 = const()[name = tensor<string, []>("obj_29_beta_0_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(167918080)))];
499 tensor<fp16, []> obj_29_epsilon_0_to_fp16 = const()[name = tensor<string, []>("obj_29_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
500 tensor<fp16, [1, 1280, 1, 1]> obj_29_cast_fp16 = batch_norm(beta = obj_29_beta_0_to_fp16, epsilon = obj_29_epsilon_0_to_fp16, gamma = obj_29_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_13_cast_fp16)[name = tensor<string, []>("obj_29_cast_fp16")];
501 tensor<string, []> var_726_pad_type_0 = const()[name = tensor<string, []>("op_726_pad_type_0"), val = tensor<string, []>("valid")];
502 tensor<int32, [2]> var_726_strides_0 = const()[name = tensor<string, []>("op_726_strides_0"), val = tensor<int32, [2]>([1, 1])];
503 tensor<int32, [4]> var_726_pad_0 = const()[name = tensor<string, []>("op_726_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
504 tensor<int32, [2]> var_726_dilations_0 = const()[name = tensor<string, []>("op_726_dilations_0"), val = tensor<int32, [2]>([1, 1])];
505 tensor<int32, []> var_726_groups_0 = const()[name = tensor<string, []>("op_726_groups_0"), val = tensor<int32, []>(1)];
506 tensor<fp16, [1280, 1280, 1, 1]> layers_2_self_attn_q_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [819200]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(167920704))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(168739968))), name = tensor<string, []>("layers_2_self_attn_q_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
507 tensor<fp16, [1280]> layers_2_self_attn_q_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_2_self_attn_q_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(168740096)))];
508 tensor<fp16, [1, 1280, 1, 1]> var_726_cast_fp16 = conv(bias = layers_2_self_attn_q_proj_inlier_module_bias_to_fp16, dilations = var_726_dilations_0, groups = var_726_groups_0, pad = var_726_pad_0, pad_type = var_726_pad_type_0, strides = var_726_strides_0, weight = layers_2_self_attn_q_proj_inlier_module_weight_to_fp16_palettized, x = obj_29_cast_fp16)[name = tensor<string, []>("op_726_cast_fp16")];
509 tensor<string, []> var_732_pad_type_0 = const()[name = tensor<string, []>("op_732_pad_type_0"), val = tensor<string, []>("valid")];
510 tensor<int32, [2]> var_732_strides_0 = const()[name = tensor<string, []>("op_732_strides_0"), val = tensor<int32, [2]>([1, 1])];
511 tensor<int32, [4]> var_732_pad_0 = const()[name = tensor<string, []>("op_732_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
512 tensor<int32, [2]> var_732_dilations_0 = const()[name = tensor<string, []>("op_732_dilations_0"), val = tensor<int32, [2]>([1, 1])];
513 tensor<int32, []> var_732_groups_0 = const()[name = tensor<string, []>("op_732_groups_0"), val = tensor<int32, []>(1)];
514 tensor<fp16, [1280, 1280, 1, 1]> layers_2_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [204800]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(168774976))), name = tensor<string, []>("layers_2_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [16094]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(168742720))), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
515 tensor<fp16, [1, 1280, 1, 1]> var_732_cast_fp16 = conv(dilations = var_732_dilations_0, groups = var_732_groups_0, pad = var_732_pad_0, pad_type = var_732_pad_type_0, strides = var_732_strides_0, weight = layers_2_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified, x = obj_29_cast_fp16)[name = tensor<string, []>("op_732_cast_fp16")];
516 tensor<fp16, [1, 1280, 1, 1]> query_9_cast_fp16 = add(x = var_726_cast_fp16, y = var_732_cast_fp16)[name = tensor<string, []>("query_9_cast_fp16")];
517 tensor<string, []> var_741_pad_type_0 = const()[name = tensor<string, []>("op_741_pad_type_0"), val = tensor<string, []>("valid")];
518 tensor<int32, [2]> var_741_strides_0 = const()[name = tensor<string, []>("op_741_strides_0"), val = tensor<int32, [2]>([1, 1])];
519 tensor<int32, [4]> var_741_pad_0 = const()[name = tensor<string, []>("op_741_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
520 tensor<int32, [2]> var_741_dilations_0 = const()[name = tensor<string, []>("op_741_dilations_0"), val = tensor<int32, [2]>([1, 1])];
521 tensor<int32, []> var_741_groups_0 = const()[name = tensor<string, []>("op_741_groups_0"), val = tensor<int32, []>(1)];
522 tensor<fp16, [1280, 1280, 1, 1]> layers_2_self_attn_k_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [819200]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(168979840))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(169799104))), name = tensor<string, []>("layers_2_self_attn_k_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
523 tensor<fp16, [1, 1280, 1, 1]> var_741_cast_fp16 = conv(dilations = var_741_dilations_0, groups = var_741_groups_0, pad = var_741_pad_0, pad_type = var_741_pad_type_0, strides = var_741_strides_0, weight = layers_2_self_attn_k_proj_inlier_module_weight_to_fp16_palettized, x = obj_29_cast_fp16)[name = tensor<string, []>("op_741_cast_fp16")];
524 tensor<string, []> var_747_pad_type_0 = const()[name = tensor<string, []>("op_747_pad_type_0"), val = tensor<string, []>("valid")];
525 tensor<int32, [2]> var_747_strides_0 = const()[name = tensor<string, []>("op_747_strides_0"), val = tensor<int32, [2]>([1, 1])];
526 tensor<int32, [4]> var_747_pad_0 = const()[name = tensor<string, []>("op_747_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
527 tensor<int32, [2]> var_747_dilations_0 = const()[name = tensor<string, []>("op_747_dilations_0"), val = tensor<int32, [2]>([1, 1])];
528 tensor<int32, []> var_747_groups_0 = const()[name = tensor<string, []>("op_747_groups_0"), val = tensor<int32, []>(1)];
529 tensor<fp16, [1280, 1280, 1, 1]> layers_2_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [204800]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(169836736))), name = tensor<string, []>("layers_2_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [18690]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(169799232))), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
530 tensor<fp16, [1, 1280, 1, 1]> var_747_cast_fp16 = conv(dilations = var_747_dilations_0, groups = var_747_groups_0, pad = var_747_pad_0, pad_type = var_747_pad_type_0, strides = var_747_strides_0, weight = layers_2_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified, x = obj_29_cast_fp16)[name = tensor<string, []>("op_747_cast_fp16")];
531 tensor<fp16, [1, 1280, 1, 1]> current_key_5_cast_fp16 = add(x = var_741_cast_fp16, y = var_747_cast_fp16)[name = tensor<string, []>("current_key_5_cast_fp16")];
532 tensor<string, []> var_757_pad_type_0 = const()[name = tensor<string, []>("op_757_pad_type_0"), val = tensor<string, []>("valid")];
533 tensor<int32, [2]> var_757_strides_0 = const()[name = tensor<string, []>("op_757_strides_0"), val = tensor<int32, [2]>([1, 1])];
534 tensor<int32, [4]> var_757_pad_0 = const()[name = tensor<string, []>("op_757_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
535 tensor<int32, [2]> var_757_dilations_0 = const()[name = tensor<string, []>("op_757_dilations_0"), val = tensor<int32, [2]>([1, 1])];
536 tensor<int32, []> var_757_groups_0 = const()[name = tensor<string, []>("op_757_groups_0"), val = tensor<int32, []>(1)];
537 tensor<fp16, [1280, 1280, 1, 1]> layers_2_self_attn_v_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [819200]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(170041600))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(170860864))), name = tensor<string, []>("layers_2_self_attn_v_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
538 tensor<fp16, [1280]> layers_2_self_attn_v_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_2_self_attn_v_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(170860992)))];
539 tensor<fp16, [1, 1280, 1, 1]> var_757_cast_fp16 = conv(bias = layers_2_self_attn_v_proj_inlier_module_bias_to_fp16, dilations = var_757_dilations_0, groups = var_757_groups_0, pad = var_757_pad_0, pad_type = var_757_pad_type_0, strides = var_757_strides_0, weight = layers_2_self_attn_v_proj_inlier_module_weight_to_fp16_palettized, x = obj_29_cast_fp16)[name = tensor<string, []>("op_757_cast_fp16")];
540 tensor<string, []> var_763_pad_type_0 = const()[name = tensor<string, []>("op_763_pad_type_0"), val = tensor<string, []>("valid")];
541 tensor<int32, [2]> var_763_strides_0 = const()[name = tensor<string, []>("op_763_strides_0"), val = tensor<int32, [2]>([1, 1])];
542 tensor<int32, [4]> var_763_pad_0 = const()[name = tensor<string, []>("op_763_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
543 tensor<int32, [2]> var_763_dilations_0 = const()[name = tensor<string, []>("op_763_dilations_0"), val = tensor<int32, [2]>([1, 1])];
544 tensor<int32, []> var_763_groups_0 = const()[name = tensor<string, []>("op_763_groups_0"), val = tensor<int32, []>(1)];
545 tensor<fp16, [1280, 1280, 1, 1]> layers_2_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [204800]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(170876544))), name = tensor<string, []>("layers_2_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [6431]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(170863616))), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
546 tensor<fp16, [1, 1280, 1, 1]> var_763_cast_fp16 = conv(dilations = var_763_dilations_0, groups = var_763_groups_0, pad = var_763_pad_0, pad_type = var_763_pad_type_0, strides = var_763_strides_0, weight = layers_2_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified, x = obj_29_cast_fp16)[name = tensor<string, []>("op_763_cast_fp16")];
547 tensor<fp16, [1, 1280, 1, 1]> current_value_5_cast_fp16 = add(x = var_757_cast_fp16, y = var_763_cast_fp16)[name = tensor<string, []>("current_value_5_cast_fp16")];
548 tensor<fp16, [1, 1280, 1, 224]> var_769_cast_fp16 = mul(x = current_key_5_cast_fp16, y = var_159_cast_fp16)[name = tensor<string, []>("op_769_cast_fp16")];
549 tensor<fp16, [1, 1280, 1, 224]> var_771_cast_fp16 = mul(x = var_53_cast_fp16_2, y = var_162_cast_fp16)[name = tensor<string, []>("op_771_cast_fp16")];
550 tensor<fp16, [1, 1280, 1, 224]> key_9_cast_fp16 = add(x = var_769_cast_fp16, y = var_771_cast_fp16)[name = tensor<string, []>("key_9_cast_fp16")];
551 tensor<fp16, [1, 1280, 1, 224]> var_773_cast_fp16 = mul(x = current_value_5_cast_fp16, y = var_159_cast_fp16)[name = tensor<string, []>("op_773_cast_fp16")];
552 tensor<fp16, [1, 1280, 1, 224]> var_775_cast_fp16 = mul(x = var_60_cast_fp16_2, y = var_162_cast_fp16)[name = tensor<string, []>("op_775_cast_fp16")];
553 tensor<fp16, [1, 1280, 1, 224]> value_9_cast_fp16 = add(x = var_773_cast_fp16, y = var_775_cast_fp16)[name = tensor<string, []>("value_9_cast_fp16")];
554 tensor<int32, [4]> var_778 = const()[name = tensor<string, []>("op_778"), val = tensor<int32, [4]>([1, 20, 64, -1])];
555 tensor<fp16, [1, 20, 64, 1]> mh_q_9_cast_fp16 = reshape(shape = var_778, x = query_9_cast_fp16)[name = tensor<string, []>("mh_q_9_cast_fp16")];
556 tensor<fp16, []> var_780_to_fp16 = const()[name = tensor<string, []>("op_780_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
557 tensor<fp16, [1, 20, 64, 1]> var_781_cast_fp16 = mul(x = mh_q_9_cast_fp16, y = var_780_to_fp16)[name = tensor<string, []>("op_781_cast_fp16")];
558 tensor<int32, [4]> var_782 = const()[name = tensor<string, []>("op_782"), val = tensor<int32, [4]>([1, 20, 64, -1])];
559 tensor<fp16, [1, 20, 64, 224]> var_783_cast_fp16 = reshape(shape = var_782, x = key_9_cast_fp16)[name = tensor<string, []>("op_783_cast_fp16")];
560 tensor<bool, []> mh_w_13_transpose_x_0 = const()[name = tensor<string, []>("mh_w_13_transpose_x_0"), val = tensor<bool, []>(true)];
561 tensor<bool, []> mh_w_13_transpose_y_0 = const()[name = tensor<string, []>("mh_w_13_transpose_y_0"), val = tensor<bool, []>(false)];
562 tensor<fp16, [1, 20, 1, 224]> mh_w_13_cast_fp16 = matmul(transpose_x = mh_w_13_transpose_x_0, transpose_y = mh_w_13_transpose_y_0, x = var_781_cast_fp16, y = var_783_cast_fp16)[name = tensor<string, []>("mh_w_13_cast_fp16")];
563 tensor<fp16, [1, 20, 1, 224]> mh_w_15_cast_fp16 = add(x = mh_w_13_cast_fp16, y = var_180_cast_fp16)[name = tensor<string, []>("mh_w_15_cast_fp16")];
564 tensor<fp16, [1, 20, 1, 224]> var_791_cast_fp16 = softmax(axis = var_678, x = mh_w_15_cast_fp16)[name = tensor<string, []>("op_791_cast_fp16")];
565 tensor<int32, [4]> var_792 = const()[name = tensor<string, []>("op_792"), val = tensor<int32, [4]>([1, 20, 64, -1])];
566 tensor<fp16, [1, 20, 64, 224]> var_793_cast_fp16 = reshape(shape = var_792, x = value_9_cast_fp16)[name = tensor<string, []>("op_793_cast_fp16")];
567 tensor<bool, []> attn_9_transpose_x_0 = const()[name = tensor<string, []>("attn_9_transpose_x_0"), val = tensor<bool, []>(false)];
568 tensor<bool, []> attn_9_transpose_y_0 = const()[name = tensor<string, []>("attn_9_transpose_y_0"), val = tensor<bool, []>(true)];
569 tensor<fp16, [1, 20, 64, 1]> attn_9_cast_fp16 = matmul(transpose_x = attn_9_transpose_x_0, transpose_y = attn_9_transpose_y_0, x = var_793_cast_fp16, y = var_791_cast_fp16)[name = tensor<string, []>("attn_9_cast_fp16")];
570 tensor<int32, [4]> var_796 = const()[name = tensor<string, []>("op_796"), val = tensor<int32, [4]>([1, 1280, 1, -1])];
571 tensor<fp16, [1, 1280, 1, 1]> input_21_cast_fp16 = reshape(shape = var_796, x = attn_9_cast_fp16)[name = tensor<string, []>("input_21_cast_fp16")];
572 tensor<string, []> var_806_pad_type_0 = const()[name = tensor<string, []>("op_806_pad_type_0"), val = tensor<string, []>("valid")];
573 tensor<int32, [2]> var_806_strides_0 = const()[name = tensor<string, []>("op_806_strides_0"), val = tensor<int32, [2]>([1, 1])];
574 tensor<int32, [4]> var_806_pad_0 = const()[name = tensor<string, []>("op_806_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
575 tensor<int32, [2]> var_806_dilations_0 = const()[name = tensor<string, []>("op_806_dilations_0"), val = tensor<int32, [2]>([1, 1])];
576 tensor<int32, []> var_806_groups_0 = const()[name = tensor<string, []>("op_806_groups_0"), val = tensor<int32, []>(1)];
577 tensor<fp16, [1280, 1280, 1, 1]> layers_2_self_attn_o_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [819200]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(171081408))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(171900672))), name = tensor<string, []>("layers_2_self_attn_o_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
578 tensor<fp16, [1280]> layers_2_self_attn_o_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_2_self_attn_o_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(171900800)))];
579 tensor<fp16, [1, 1280, 1, 1]> var_806_cast_fp16 = conv(bias = layers_2_self_attn_o_proj_inlier_module_bias_to_fp16, dilations = var_806_dilations_0, groups = var_806_groups_0, pad = var_806_pad_0, pad_type = var_806_pad_type_0, strides = var_806_strides_0, weight = layers_2_self_attn_o_proj_inlier_module_weight_to_fp16_palettized, x = input_21_cast_fp16)[name = tensor<string, []>("op_806_cast_fp16")];
580 tensor<string, []> var_812_pad_type_0 = const()[name = tensor<string, []>("op_812_pad_type_0"), val = tensor<string, []>("valid")];
581 tensor<int32, [2]> var_812_strides_0 = const()[name = tensor<string, []>("op_812_strides_0"), val = tensor<int32, [2]>([1, 1])];
582 tensor<int32, [4]> var_812_pad_0 = const()[name = tensor<string, []>("op_812_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
583 tensor<int32, [2]> var_812_dilations_0 = const()[name = tensor<string, []>("op_812_dilations_0"), val = tensor<int32, [2]>([1, 1])];
584 tensor<int32, []> var_812_groups_0 = const()[name = tensor<string, []>("op_812_groups_0"), val = tensor<int32, []>(1)];
585 tensor<fp16, [1280, 1280, 1, 1]> layers_2_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [204800]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(171914880))), name = tensor<string, []>("layers_2_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [5678]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(171903424))), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
586 tensor<fp16, [1, 1280, 1, 1]> var_812_cast_fp16 = conv(dilations = var_812_dilations_0, groups = var_812_groups_0, pad = var_812_pad_0, pad_type = var_812_pad_type_0, strides = var_812_strides_0, weight = layers_2_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified, x = input_21_cast_fp16)[name = tensor<string, []>("op_812_cast_fp16")];
587 tensor<fp16, [1, 1280, 1, 1]> obj_35_cast_fp16 = add(x = var_806_cast_fp16, y = var_812_cast_fp16)[name = tensor<string, []>("obj_35_cast_fp16")];
588 tensor<fp16, [1, 1280, 1, 1]> inputs_15_cast_fp16 = add(x = inputs_13_cast_fp16, y = obj_35_cast_fp16)[name = tensor<string, []>("inputs_15_cast_fp16")];
589 tensor<int32, [1]> out_15_axes_0 = const()[name = tensor<string, []>("out_15_axes_0"), val = tensor<int32, [1]>([1])];
590 tensor<fp16, []> var_827_to_fp16 = const()[name = tensor<string, []>("op_827_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
591 tensor<fp16, [1, 1280, 1, 1]> out_15_cast_fp16 = layer_norm(axes = out_15_axes_0, epsilon = var_827_to_fp16, x = inputs_15_cast_fp16)[name = tensor<string, []>("out_15_cast_fp16")];
592 tensor<fp16, [1280]> obj_37_gamma_0_to_fp16 = const()[name = tensor<string, []>("obj_37_gamma_0_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(172119744)))];
593 tensor<fp16, [1280]> obj_37_beta_0_to_fp16 = const()[name = tensor<string, []>("obj_37_beta_0_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(172122368)))];
594 tensor<fp16, []> obj_37_epsilon_0_to_fp16 = const()[name = tensor<string, []>("obj_37_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
595 tensor<fp16, [1, 1280, 1, 1]> obj_37_cast_fp16 = batch_norm(beta = obj_37_beta_0_to_fp16, epsilon = obj_37_epsilon_0_to_fp16, gamma = obj_37_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_15_cast_fp16)[name = tensor<string, []>("obj_37_cast_fp16")];
596 tensor<string, []> var_849_pad_type_0 = const()[name = tensor<string, []>("op_849_pad_type_0"), val = tensor<string, []>("valid")];
597 tensor<int32, [2]> var_849_strides_0 = const()[name = tensor<string, []>("op_849_strides_0"), val = tensor<int32, [2]>([1, 1])];
598 tensor<int32, [4]> var_849_pad_0 = const()[name = tensor<string, []>("op_849_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
599 tensor<int32, [2]> var_849_dilations_0 = const()[name = tensor<string, []>("op_849_dilations_0"), val = tensor<int32, [2]>([1, 1])];
600 tensor<int32, []> var_849_groups_0 = const()[name = tensor<string, []>("op_849_groups_0"), val = tensor<int32, []>(1)];
601 tensor<fp16, [1280, 1280, 1, 1]> layers_2_encoder_attn_q_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [819200]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(172124992))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(172944256))), name = tensor<string, []>("layers_2_encoder_attn_q_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
602 tensor<fp16, [1280]> layers_2_encoder_attn_q_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_2_encoder_attn_q_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(172944384)))];
603 tensor<fp16, [1, 1280, 1, 1]> var_849_cast_fp16 = conv(bias = layers_2_encoder_attn_q_proj_inlier_module_bias_to_fp16, dilations = var_849_dilations_0, groups = var_849_groups_0, pad = var_849_pad_0, pad_type = var_849_pad_type_0, strides = var_849_strides_0, weight = layers_2_encoder_attn_q_proj_inlier_module_weight_to_fp16_palettized, x = obj_37_cast_fp16)[name = tensor<string, []>("op_849_cast_fp16")];
604 tensor<string, []> var_855_pad_type_0 = const()[name = tensor<string, []>("op_855_pad_type_0"), val = tensor<string, []>("valid")];
605 tensor<int32, [2]> var_855_strides_0 = const()[name = tensor<string, []>("op_855_strides_0"), val = tensor<int32, [2]>([1, 1])];
606 tensor<int32, [4]> var_855_pad_0 = const()[name = tensor<string, []>("op_855_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
607 tensor<int32, [2]> var_855_dilations_0 = const()[name = tensor<string, []>("op_855_dilations_0"), val = tensor<int32, [2]>([1, 1])];
608 tensor<int32, []> var_855_groups_0 = const()[name = tensor<string, []>("op_855_groups_0"), val = tensor<int32, []>(1)];
609 tensor<fp16, [1280, 1280, 1, 1]> layers_2_encoder_attn_q_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [204800]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(172974720))), name = tensor<string, []>("layers_2_encoder_attn_q_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [13824]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(172947008))), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
610 tensor<fp16, [1, 1280, 1, 1]> var_855_cast_fp16 = conv(dilations = var_855_dilations_0, groups = var_855_groups_0, pad = var_855_pad_0, pad_type = var_855_pad_type_0, strides = var_855_strides_0, weight = layers_2_encoder_attn_q_proj_outlier_module_weight_to_fp16_sparsified, x = obj_37_cast_fp16)[name = tensor<string, []>("op_855_cast_fp16")];
611 tensor<fp16, [1, 1280, 1, 1]> query_11_cast_fp16 = add(x = var_849_cast_fp16, y = var_855_cast_fp16)[name = tensor<string, []>("query_11_cast_fp16")];
612 tensor<string, []> var_864_pad_type_0 = const()[name = tensor<string, []>("op_864_pad_type_0"), val = tensor<string, []>("valid")];
613 tensor<int32, [2]> var_864_strides_0 = const()[name = tensor<string, []>("op_864_strides_0"), val = tensor<int32, [2]>([1, 1])];
614 tensor<int32, [4]> var_864_pad_0 = const()[name = tensor<string, []>("op_864_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
615 tensor<int32, [2]> var_864_dilations_0 = const()[name = tensor<string, []>("op_864_dilations_0"), val = tensor<int32, [2]>([1, 1])];
616 tensor<int32, []> var_864_groups_0 = const()[name = tensor<string, []>("op_864_groups_0"), val = tensor<int32, []>(1)];
617 tensor<fp16, [1280, 1280, 1, 1]> layers_2_encoder_attn_k_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [819200]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(173179584))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(173998848))), name = tensor<string, []>("layers_2_encoder_attn_k_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
618 tensor<fp16, [1, 1280, 1, 1500]> var_864_cast_fp16 = conv(dilations = var_864_dilations_0, groups = var_864_groups_0, pad = var_864_pad_0, pad_type = var_864_pad_type_0, strides = var_864_strides_0, weight = layers_2_encoder_attn_k_proj_inlier_module_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor<string, []>("op_864_cast_fp16")];
619 tensor<string, []> var_870_pad_type_0 = const()[name = tensor<string, []>("op_870_pad_type_0"), val = tensor<string, []>("valid")];
620 tensor<int32, [2]> var_870_strides_0 = const()[name = tensor<string, []>("op_870_strides_0"), val = tensor<int32, [2]>([1, 1])];
621 tensor<int32, [4]> var_870_pad_0 = const()[name = tensor<string, []>("op_870_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
622 tensor<int32, [2]> var_870_dilations_0 = const()[name = tensor<string, []>("op_870_dilations_0"), val = tensor<int32, [2]>([1, 1])];
623 tensor<int32, []> var_870_groups_0 = const()[name = tensor<string, []>("op_870_groups_0"), val = tensor<int32, []>(1)];
624 tensor<fp16, [1280, 1280, 1, 1]> layers_2_encoder_attn_k_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [204800]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(174026816))), name = tensor<string, []>("layers_2_encoder_attn_k_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [13879]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(173998976))), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
625 tensor<fp16, [1, 1280, 1, 1500]> var_870_cast_fp16 = conv(dilations = var_870_dilations_0, groups = var_870_groups_0, pad = var_870_pad_0, pad_type = var_870_pad_type_0, strides = var_870_strides_0, weight = layers_2_encoder_attn_k_proj_outlier_module_weight_to_fp16_sparsified, x = encoder_output_embeds)[name = tensor<string, []>("op_870_cast_fp16")];
626 tensor<fp16, [1, 1280, 1, 1500]> key_11_cast_fp16 = add(x = var_864_cast_fp16, y = var_870_cast_fp16)[name = tensor<string, []>("key_11_cast_fp16")];
627 tensor<string, []> var_880_pad_type_0 = const()[name = tensor<string, []>("op_880_pad_type_0"), val = tensor<string, []>("valid")];
628 tensor<int32, [2]> var_880_strides_0 = const()[name = tensor<string, []>("op_880_strides_0"), val = tensor<int32, [2]>([1, 1])];
629 tensor<int32, [4]> var_880_pad_0 = const()[name = tensor<string, []>("op_880_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
630 tensor<int32, [2]> var_880_dilations_0 = const()[name = tensor<string, []>("op_880_dilations_0"), val = tensor<int32, [2]>([1, 1])];
631 tensor<int32, []> var_880_groups_0 = const()[name = tensor<string, []>("op_880_groups_0"), val = tensor<int32, []>(1)];
632 tensor<fp16, [1280, 1280, 1, 1]> layers_2_encoder_attn_v_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [819200]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(174231680))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(175050944))), name = tensor<string, []>("layers_2_encoder_attn_v_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
633 tensor<fp16, [1280]> layers_2_encoder_attn_v_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_2_encoder_attn_v_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(175051072)))];
634 tensor<fp16, [1, 1280, 1, 1500]> var_880_cast_fp16 = conv(bias = layers_2_encoder_attn_v_proj_inlier_module_bias_to_fp16, dilations = var_880_dilations_0, groups = var_880_groups_0, pad = var_880_pad_0, pad_type = var_880_pad_type_0, strides = var_880_strides_0, weight = layers_2_encoder_attn_v_proj_inlier_module_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor<string, []>("op_880_cast_fp16")];
635 tensor<string, []> var_886_pad_type_0 = const()[name = tensor<string, []>("op_886_pad_type_0"), val = tensor<string, []>("valid")];
636 tensor<int32, [2]> var_886_strides_0 = const()[name = tensor<string, []>("op_886_strides_0"), val = tensor<int32, [2]>([1, 1])];
637 tensor<int32, [4]> var_886_pad_0 = const()[name = tensor<string, []>("op_886_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
638 tensor<int32, [2]> var_886_dilations_0 = const()[name = tensor<string, []>("op_886_dilations_0"), val = tensor<int32, [2]>([1, 1])];
639 tensor<int32, []> var_886_groups_0 = const()[name = tensor<string, []>("op_886_groups_0"), val = tensor<int32, []>(1)];
640 tensor<fp16, [1280, 1280, 1, 1]> layers_2_encoder_attn_v_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [204800]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(175065280))), name = tensor<string, []>("layers_2_encoder_attn_v_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [5756]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(175053696))), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
641 tensor<fp16, [1, 1280, 1, 1500]> var_886_cast_fp16 = conv(dilations = var_886_dilations_0, groups = var_886_groups_0, pad = var_886_pad_0, pad_type = var_886_pad_type_0, strides = var_886_strides_0, weight = layers_2_encoder_attn_v_proj_outlier_module_weight_to_fp16_sparsified, x = encoder_output_embeds)[name = tensor<string, []>("op_886_cast_fp16")];
642 tensor<fp16, [1, 1280, 1, 1500]> value_11_cast_fp16 = add(x = var_880_cast_fp16, y = var_886_cast_fp16)[name = tensor<string, []>("value_11_cast_fp16")];
643 tensor<int32, [4]> var_889 = const()[name = tensor<string, []>("op_889"), val = tensor<int32, [4]>([1, 20, 64, -1])];
644 tensor<fp16, [1, 20, 64, 1]> mh_q_11_cast_fp16 = reshape(shape = var_889, x = query_11_cast_fp16)[name = tensor<string, []>("mh_q_11_cast_fp16")];
645 tensor<fp16, []> var_891_to_fp16 = const()[name = tensor<string, []>("op_891_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
646 tensor<fp16, [1, 20, 64, 1]> var_892_cast_fp16 = mul(x = mh_q_11_cast_fp16, y = var_891_to_fp16)[name = tensor<string, []>("op_892_cast_fp16")];
647 tensor<int32, [4]> var_893 = const()[name = tensor<string, []>("op_893"), val = tensor<int32, [4]>([1, 20, 64, -1])];
648 tensor<fp16, [1, 20, 64, 1500]> var_894_cast_fp16 = reshape(shape = var_893, x = key_11_cast_fp16)[name = tensor<string, []>("op_894_cast_fp16")];
649 tensor<bool, []> mh_w_17_transpose_x_0 = const()[name = tensor<string, []>("mh_w_17_transpose_x_0"), val = tensor<bool, []>(true)];
650 tensor<bool, []> mh_w_17_transpose_y_0 = const()[name = tensor<string, []>("mh_w_17_transpose_y_0"), val = tensor<bool, []>(false)];
651 tensor<fp16, [1, 20, 1, 1500]> mh_w_17_cast_fp16 = matmul(transpose_x = mh_w_17_transpose_x_0, transpose_y = mh_w_17_transpose_y_0, x = var_892_cast_fp16, y = var_894_cast_fp16)[name = tensor<string, []>("mh_w_17_cast_fp16")];
652 tensor<fp16, [1, 20, 1, 1500]> obj_41_cast_fp16 = softmax(axis = var_678, x = mh_w_17_cast_fp16)[name = tensor<string, []>("obj_41_cast_fp16")];
653 tensor<int32, [4]> var_898 = const()[name = tensor<string, []>("op_898"), val = tensor<int32, [4]>([1, 20, 64, -1])];
654 tensor<fp16, [1, 20, 64, 1500]> var_899_cast_fp16 = reshape(shape = var_898, x = value_11_cast_fp16)[name = tensor<string, []>("op_899_cast_fp16")];
655 tensor<bool, []> attn_11_transpose_x_0 = const()[name = tensor<string, []>("attn_11_transpose_x_0"), val = tensor<bool, []>(false)];
656 tensor<bool, []> attn_11_transpose_y_0 = const()[name = tensor<string, []>("attn_11_transpose_y_0"), val = tensor<bool, []>(true)];
657 tensor<fp16, [1, 20, 64, 1]> attn_11_cast_fp16 = matmul(transpose_x = attn_11_transpose_x_0, transpose_y = attn_11_transpose_y_0, x = var_899_cast_fp16, y = obj_41_cast_fp16)[name = tensor<string, []>("attn_11_cast_fp16")];
658 tensor<int32, [4]> var_902 = const()[name = tensor<string, []>("op_902"), val = tensor<int32, [4]>([1, 1280, 1, -1])];
659 tensor<fp16, [1, 1280, 1, 1]> input_23_cast_fp16 = reshape(shape = var_902, x = attn_11_cast_fp16)[name = tensor<string, []>("input_23_cast_fp16")];
660 tensor<string, []> var_912_pad_type_0 = const()[name = tensor<string, []>("op_912_pad_type_0"), val = tensor<string, []>("valid")];
661 tensor<int32, [2]> var_912_strides_0 = const()[name = tensor<string, []>("op_912_strides_0"), val = tensor<int32, [2]>([1, 1])];
662 tensor<int32, [4]> var_912_pad_0 = const()[name = tensor<string, []>("op_912_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
663 tensor<int32, [2]> var_912_dilations_0 = const()[name = tensor<string, []>("op_912_dilations_0"), val = tensor<int32, [2]>([1, 1])];
664 tensor<int32, []> var_912_groups_0 = const()[name = tensor<string, []>("op_912_groups_0"), val = tensor<int32, []>(1)];
665 tensor<fp16, [1280, 1280, 1, 1]> layers_2_encoder_attn_o_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [819200]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(175270144))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(176089408))), name = tensor<string, []>("layers_2_encoder_attn_o_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
666 tensor<fp16, [1280]> layers_2_encoder_attn_o_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_2_encoder_attn_o_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(176089536)))];
667 tensor<fp16, [1, 1280, 1, 1]> var_912_cast_fp16 = conv(bias = layers_2_encoder_attn_o_proj_inlier_module_bias_to_fp16, dilations = var_912_dilations_0, groups = var_912_groups_0, pad = var_912_pad_0, pad_type = var_912_pad_type_0, strides = var_912_strides_0, weight = layers_2_encoder_attn_o_proj_inlier_module_weight_to_fp16_palettized, x = input_23_cast_fp16)[name = tensor<string, []>("op_912_cast_fp16")];
668 tensor<string, []> var_918_pad_type_0 = const()[name = tensor<string, []>("op_918_pad_type_0"), val = tensor<string, []>("valid")];
669 tensor<int32, [2]> var_918_strides_0 = const()[name = tensor<string, []>("op_918_strides_0"), val = tensor<int32, [2]>([1, 1])];
670 tensor<int32, [4]> var_918_pad_0 = const()[name = tensor<string, []>("op_918_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
671 tensor<int32, [2]> var_918_dilations_0 = const()[name = tensor<string, []>("op_918_dilations_0"), val = tensor<int32, [2]>([1, 1])];
672 tensor<int32, []> var_918_groups_0 = const()[name = tensor<string, []>("op_918_groups_0"), val = tensor<int32, []>(1)];
673 tensor<fp16, [1280, 1280, 1, 1]> layers_2_encoder_attn_o_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [204800]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(176105152))), name = tensor<string, []>("layers_2_encoder_attn_o_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [6438]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(176092160))), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
674 tensor<fp16, [1, 1280, 1, 1]> var_918_cast_fp16 = conv(dilations = var_918_dilations_0, groups = var_918_groups_0, pad = var_918_pad_0, pad_type = var_918_pad_type_0, strides = var_918_strides_0, weight = layers_2_encoder_attn_o_proj_outlier_module_weight_to_fp16_sparsified, x = input_23_cast_fp16)[name = tensor<string, []>("op_918_cast_fp16")];
675 tensor<fp16, [1, 1280, 1, 1]> obj_39_cast_fp16 = add(x = var_912_cast_fp16, y = var_918_cast_fp16)[name = tensor<string, []>("obj_39_cast_fp16")];
676 tensor<fp16, [1, 1280, 1, 1]> inputs_17_cast_fp16 = add(x = inputs_15_cast_fp16, y = obj_39_cast_fp16)[name = tensor<string, []>("inputs_17_cast_fp16")];
677 tensor<int32, [1]> out_17_axes_0 = const()[name = tensor<string, []>("out_17_axes_0"), val = tensor<int32, [1]>([1])];
678 tensor<fp16, []> var_932_to_fp16 = const()[name = tensor<string, []>("op_932_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
679 tensor<fp16, [1, 1280, 1, 1]> out_17_cast_fp16 = layer_norm(axes = out_17_axes_0, epsilon = var_932_to_fp16, x = inputs_17_cast_fp16)[name = tensor<string, []>("out_17_cast_fp16")];
680 tensor<fp16, [1280]> input_25_gamma_0_to_fp16 = const()[name = tensor<string, []>("input_25_gamma_0_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(176310016)))];
681 tensor<fp16, [1280]> input_25_beta_0_to_fp16 = const()[name = tensor<string, []>("input_25_beta_0_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(176312640)))];
682 tensor<fp16, []> input_25_epsilon_0_to_fp16 = const()[name = tensor<string, []>("input_25_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
683 tensor<fp16, [1, 1280, 1, 1]> input_25_cast_fp16 = batch_norm(beta = input_25_beta_0_to_fp16, epsilon = input_25_epsilon_0_to_fp16, gamma = input_25_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_17_cast_fp16)[name = tensor<string, []>("input_25_cast_fp16")];
684 tensor<string, []> var_950_pad_type_0 = const()[name = tensor<string, []>("op_950_pad_type_0"), val = tensor<string, []>("valid")];
685 tensor<int32, [2]> var_950_strides_0 = const()[name = tensor<string, []>("op_950_strides_0"), val = tensor<int32, [2]>([1, 1])];
686 tensor<int32, [4]> var_950_pad_0 = const()[name = tensor<string, []>("op_950_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
687 tensor<int32, [2]> var_950_dilations_0 = const()[name = tensor<string, []>("op_950_dilations_0"), val = tensor<int32, [2]>([1, 1])];
688 tensor<int32, []> var_950_groups_0 = const()[name = tensor<string, []>("op_950_groups_0"), val = tensor<int32, []>(1)];
689 tensor<fp16, [5120, 1280, 1, 1]> layers_2_fc1_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [3276800]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(176315264))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(179592128))), name = tensor<string, []>("layers_2_fc1_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([5120, 1280, 1, 1])];
690 tensor<fp16, [5120]> layers_2_fc1_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_2_fc1_inlier_module_bias_to_fp16"), val = tensor<fp16, [5120]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(179592256)))];
691 tensor<fp16, [1, 5120, 1, 1]> var_950_cast_fp16 = conv(bias = layers_2_fc1_inlier_module_bias_to_fp16, dilations = var_950_dilations_0, groups = var_950_groups_0, pad = var_950_pad_0, pad_type = var_950_pad_type_0, strides = var_950_strides_0, weight = layers_2_fc1_inlier_module_weight_to_fp16_palettized, x = input_25_cast_fp16)[name = tensor<string, []>("op_950_cast_fp16")];
692 tensor<string, []> var_956_pad_type_0 = const()[name = tensor<string, []>("op_956_pad_type_0"), val = tensor<string, []>("valid")];
693 tensor<int32, [2]> var_956_strides_0 = const()[name = tensor<string, []>("op_956_strides_0"), val = tensor<int32, [2]>([1, 1])];
694 tensor<int32, [4]> var_956_pad_0 = const()[name = tensor<string, []>("op_956_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
695 tensor<int32, [2]> var_956_dilations_0 = const()[name = tensor<string, []>("op_956_dilations_0"), val = tensor<int32, [2]>([1, 1])];
696 tensor<int32, []> var_956_groups_0 = const()[name = tensor<string, []>("op_956_groups_0"), val = tensor<int32, []>(1)];
697 tensor<fp16, [5120, 1280, 1, 1]> layers_2_fc1_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [819200]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(179764480))), name = tensor<string, []>("layers_2_fc1_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [80920]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(179602560))), shape = tensor<uint32, [4]>([5120, 1280, 1, 1])];
698 tensor<fp16, [1, 5120, 1, 1]> var_956_cast_fp16 = conv(dilations = var_956_dilations_0, groups = var_956_groups_0, pad = var_956_pad_0, pad_type = var_956_pad_type_0, strides = var_956_strides_0, weight = layers_2_fc1_outlier_module_weight_to_fp16_sparsified, x = input_25_cast_fp16)[name = tensor<string, []>("op_956_cast_fp16")];
699 tensor<fp16, [1, 5120, 1, 1]> input_27_cast_fp16 = add(x = var_950_cast_fp16, y = var_956_cast_fp16)[name = tensor<string, []>("input_27_cast_fp16")];
700 tensor<string, []> input_29_mode_0 = const()[name = tensor<string, []>("input_29_mode_0"), val = tensor<string, []>("EXACT")];
701 tensor<fp16, [1, 5120, 1, 1]> input_29_cast_fp16 = gelu(mode = input_29_mode_0, x = input_27_cast_fp16)[name = tensor<string, []>("input_29_cast_fp16")];
702 tensor<string, []> var_967_pad_type_0 = const()[name = tensor<string, []>("op_967_pad_type_0"), val = tensor<string, []>("valid")];
703 tensor<int32, [2]> var_967_strides_0 = const()[name = tensor<string, []>("op_967_strides_0"), val = tensor<int32, [2]>([1, 1])];
704 tensor<int32, [4]> var_967_pad_0 = const()[name = tensor<string, []>("op_967_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
705 tensor<int32, [2]> var_967_dilations_0 = const()[name = tensor<string, []>("op_967_dilations_0"), val = tensor<int32, [2]>([1, 1])];
706 tensor<int32, []> var_967_groups_0 = const()[name = tensor<string, []>("op_967_groups_0"), val = tensor<int32, []>(1)];
707 tensor<fp16, [1280, 5120, 1, 1]> layers_2_fc2_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [3276800]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(180583744))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(183860608))), name = tensor<string, []>("layers_2_fc2_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([1280, 5120, 1, 1])];
708 tensor<fp16, [1280]> layers_2_fc2_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_2_fc2_inlier_module_bias_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(183860736)))];
709 tensor<fp16, [1, 1280, 1, 1]> var_967_cast_fp16 = conv(bias = layers_2_fc2_inlier_module_bias_to_fp16, dilations = var_967_dilations_0, groups = var_967_groups_0, pad = var_967_pad_0, pad_type = var_967_pad_type_0, strides = var_967_strides_0, weight = layers_2_fc2_inlier_module_weight_to_fp16_palettized, x = input_29_cast_fp16)[name = tensor<string, []>("op_967_cast_fp16")];
710 tensor<string, []> var_973_pad_type_0 = const()[name = tensor<string, []>("op_973_pad_type_0"), val = tensor<string, []>("valid")];
711 tensor<int32, [2]> var_973_strides_0 = const()[name = tensor<string, []>("op_973_strides_0"), val = tensor<int32, [2]>([1, 1])];
712 tensor<int32, [4]> var_973_pad_0 = const()[name = tensor<string, []>("op_973_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
713 tensor<int32, [2]> var_973_dilations_0 = const()[name = tensor<string, []>("op_973_dilations_0"), val = tensor<int32, [2]>([1, 1])];
714 tensor<int32, []> var_973_groups_0 = const()[name = tensor<string, []>("op_973_groups_0"), val = tensor<int32, []>(1)];
715 tensor<fp16, [1280, 5120, 1, 1]> layers_2_fc2_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [819200]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(183943552))), name = tensor<string, []>("layers_2_fc2_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [40054]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(183863360))), shape = tensor<uint32, [4]>([1280, 5120, 1, 1])];
716 tensor<fp16, [1, 1280, 1, 1]> var_973_cast_fp16 = conv(dilations = var_973_dilations_0, groups = var_973_groups_0, pad = var_973_pad_0, pad_type = var_973_pad_type_0, strides = var_973_strides_0, weight = layers_2_fc2_outlier_module_weight_to_fp16_sparsified, x = input_29_cast_fp16)[name = tensor<string, []>("op_973_cast_fp16")];
717 tensor<fp16, [1, 1280, 1, 1]> hidden_states_7_cast_fp16 = add(x = var_967_cast_fp16, y = var_973_cast_fp16)[name = tensor<string, []>("hidden_states_7_cast_fp16")];
718 tensor<fp16, [1, 1280, 1, 1]> inputs_19_cast_fp16 = add(x = inputs_17_cast_fp16, y = hidden_states_7_cast_fp16)[name = tensor<string, []>("inputs_19_cast_fp16")];
719 tensor<int32, []> var_986 = const()[name = tensor<string, []>("op_986"), val = tensor<int32, []>(3)];
720 tensor<int32, [1]> out_19_axes_0 = const()[name = tensor<string, []>("out_19_axes_0"), val = tensor<int32, [1]>([1])];
721 tensor<fp16, []> var_1012_to_fp16 = const()[name = tensor<string, []>("op_1012_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
722 tensor<fp16, [1, 1280, 1, 1]> out_19_cast_fp16 = layer_norm(axes = out_19_axes_0, epsilon = var_1012_to_fp16, x = inputs_19_cast_fp16)[name = tensor<string, []>("out_19_cast_fp16")];
723 tensor<fp16, [1280]> obj_43_gamma_0_to_fp16 = const()[name = tensor<string, []>("obj_43_gamma_0_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(184762816)))];
724 tensor<fp16, [1280]> obj_43_beta_0_to_fp16 = const()[name = tensor<string, []>("obj_43_beta_0_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(184765440)))];
725 tensor<fp16, []> obj_43_epsilon_0_to_fp16 = const()[name = tensor<string, []>("obj_43_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
726 tensor<fp16, [1, 1280, 1, 1]> obj_43_cast_fp16 = batch_norm(beta = obj_43_beta_0_to_fp16, epsilon = obj_43_epsilon_0_to_fp16, gamma = obj_43_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_19_cast_fp16)[name = tensor<string, []>("obj_43_cast_fp16")];
727 tensor<string, []> var_1034_pad_type_0 = const()[name = tensor<string, []>("op_1034_pad_type_0"), val = tensor<string, []>("valid")];
728 tensor<int32, [2]> var_1034_strides_0 = const()[name = tensor<string, []>("op_1034_strides_0"), val = tensor<int32, [2]>([1, 1])];
729 tensor<int32, [4]> var_1034_pad_0 = const()[name = tensor<string, []>("op_1034_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
730 tensor<int32, [2]> var_1034_dilations_0 = const()[name = tensor<string, []>("op_1034_dilations_0"), val = tensor<int32, [2]>([1, 1])];
731 tensor<int32, []> var_1034_groups_0 = const()[name = tensor<string, []>("op_1034_groups_0"), val = tensor<int32, []>(1)];
732 tensor<fp16, [1280, 1280, 1, 1]> layers_3_self_attn_q_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [819200]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(184768064))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(185587328))), name = tensor<string, []>("layers_3_self_attn_q_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
733 tensor<fp16, [1280]> layers_3_self_attn_q_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_3_self_attn_q_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(185587456)))];
734 tensor<fp16, [1, 1280, 1, 1]> var_1034_cast_fp16 = conv(bias = layers_3_self_attn_q_proj_inlier_module_bias_to_fp16, dilations = var_1034_dilations_0, groups = var_1034_groups_0, pad = var_1034_pad_0, pad_type = var_1034_pad_type_0, strides = var_1034_strides_0, weight = layers_3_self_attn_q_proj_inlier_module_weight_to_fp16_palettized, x = obj_43_cast_fp16)[name = tensor<string, []>("op_1034_cast_fp16")];
735 tensor<string, []> var_1040_pad_type_0 = const()[name = tensor<string, []>("op_1040_pad_type_0"), val = tensor<string, []>("valid")];
736 tensor<int32, [2]> var_1040_strides_0 = const()[name = tensor<string, []>("op_1040_strides_0"), val = tensor<int32, [2]>([1, 1])];
737 tensor<int32, [4]> var_1040_pad_0 = const()[name = tensor<string, []>("op_1040_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
738 tensor<int32, [2]> var_1040_dilations_0 = const()[name = tensor<string, []>("op_1040_dilations_0"), val = tensor<int32, [2]>([1, 1])];
739 tensor<int32, []> var_1040_groups_0 = const()[name = tensor<string, []>("op_1040_groups_0"), val = tensor<int32, []>(1)];
740 tensor<fp16, [1280, 1280, 1, 1]> layers_3_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [204800]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(185611520))), name = tensor<string, []>("layers_3_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [10664]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(185590080))), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
741 tensor<fp16, [1, 1280, 1, 1]> var_1040_cast_fp16 = conv(dilations = var_1040_dilations_0, groups = var_1040_groups_0, pad = var_1040_pad_0, pad_type = var_1040_pad_type_0, strides = var_1040_strides_0, weight = layers_3_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified, x = obj_43_cast_fp16)[name = tensor<string, []>("op_1040_cast_fp16")];
742 tensor<fp16, [1, 1280, 1, 1]> query_13_cast_fp16 = add(x = var_1034_cast_fp16, y = var_1040_cast_fp16)[name = tensor<string, []>("query_13_cast_fp16")];
743 tensor<string, []> var_1049_pad_type_0 = const()[name = tensor<string, []>("op_1049_pad_type_0"), val = tensor<string, []>("valid")];
744 tensor<int32, [2]> var_1049_strides_0 = const()[name = tensor<string, []>("op_1049_strides_0"), val = tensor<int32, [2]>([1, 1])];
745 tensor<int32, [4]> var_1049_pad_0 = const()[name = tensor<string, []>("op_1049_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
746 tensor<int32, [2]> var_1049_dilations_0 = const()[name = tensor<string, []>("op_1049_dilations_0"), val = tensor<int32, [2]>([1, 1])];
747 tensor<int32, []> var_1049_groups_0 = const()[name = tensor<string, []>("op_1049_groups_0"), val = tensor<int32, []>(1)];
748 tensor<fp16, [1280, 1280, 1, 1]> layers_3_self_attn_k_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [819200]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(185816384))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(186635648))), name = tensor<string, []>("layers_3_self_attn_k_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
749 tensor<fp16, [1, 1280, 1, 1]> var_1049_cast_fp16 = conv(dilations = var_1049_dilations_0, groups = var_1049_groups_0, pad = var_1049_pad_0, pad_type = var_1049_pad_type_0, strides = var_1049_strides_0, weight = layers_3_self_attn_k_proj_inlier_module_weight_to_fp16_palettized, x = obj_43_cast_fp16)[name = tensor<string, []>("op_1049_cast_fp16")];
750 tensor<string, []> var_1055_pad_type_0 = const()[name = tensor<string, []>("op_1055_pad_type_0"), val = tensor<string, []>("valid")];
751 tensor<int32, [2]> var_1055_strides_0 = const()[name = tensor<string, []>("op_1055_strides_0"), val = tensor<int32, [2]>([1, 1])];
752 tensor<int32, [4]> var_1055_pad_0 = const()[name = tensor<string, []>("op_1055_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
753 tensor<int32, [2]> var_1055_dilations_0 = const()[name = tensor<string, []>("op_1055_dilations_0"), val = tensor<int32, [2]>([1, 1])];
754 tensor<int32, []> var_1055_groups_0 = const()[name = tensor<string, []>("op_1055_groups_0"), val = tensor<int32, []>(1)];
755 tensor<fp16, [1280, 1280, 1, 1]> layers_3_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [204800]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(186656640))), name = tensor<string, []>("layers_3_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [10387]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(186635776))), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
756 tensor<fp16, [1, 1280, 1, 1]> var_1055_cast_fp16 = conv(dilations = var_1055_dilations_0, groups = var_1055_groups_0, pad = var_1055_pad_0, pad_type = var_1055_pad_type_0, strides = var_1055_strides_0, weight = layers_3_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified, x = obj_43_cast_fp16)[name = tensor<string, []>("op_1055_cast_fp16")];
757 tensor<fp16, [1, 1280, 1, 1]> current_key_cast_fp16 = add(x = var_1049_cast_fp16, y = var_1055_cast_fp16)[name = tensor<string, []>("current_key_cast_fp16")];
758 tensor<string, []> var_1065_pad_type_0 = const()[name = tensor<string, []>("op_1065_pad_type_0"), val = tensor<string, []>("valid")];
759 tensor<int32, [2]> var_1065_strides_0 = const()[name = tensor<string, []>("op_1065_strides_0"), val = tensor<int32, [2]>([1, 1])];
760 tensor<int32, [4]> var_1065_pad_0 = const()[name = tensor<string, []>("op_1065_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
761 tensor<int32, [2]> var_1065_dilations_0 = const()[name = tensor<string, []>("op_1065_dilations_0"), val = tensor<int32, [2]>([1, 1])];
762 tensor<int32, []> var_1065_groups_0 = const()[name = tensor<string, []>("op_1065_groups_0"), val = tensor<int32, []>(1)];
763 tensor<fp16, [1280, 1280, 1, 1]> layers_3_self_attn_v_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [819200]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(186861504))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(187680768))), name = tensor<string, []>("layers_3_self_attn_v_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
764 tensor<fp16, [1280]> layers_3_self_attn_v_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_3_self_attn_v_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(187680896)))];
765 tensor<fp16, [1, 1280, 1, 1]> var_1065_cast_fp16 = conv(bias = layers_3_self_attn_v_proj_inlier_module_bias_to_fp16, dilations = var_1065_dilations_0, groups = var_1065_groups_0, pad = var_1065_pad_0, pad_type = var_1065_pad_type_0, strides = var_1065_strides_0, weight = layers_3_self_attn_v_proj_inlier_module_weight_to_fp16_palettized, x = obj_43_cast_fp16)[name = tensor<string, []>("op_1065_cast_fp16")];
766 tensor<string, []> var_1071_pad_type_0 = const()[name = tensor<string, []>("op_1071_pad_type_0"), val = tensor<string, []>("valid")];
767 tensor<int32, [2]> var_1071_strides_0 = const()[name = tensor<string, []>("op_1071_strides_0"), val = tensor<int32, [2]>([1, 1])];
768 tensor<int32, [4]> var_1071_pad_0 = const()[name = tensor<string, []>("op_1071_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
769 tensor<int32, [2]> var_1071_dilations_0 = const()[name = tensor<string, []>("op_1071_dilations_0"), val = tensor<int32, [2]>([1, 1])];
770 tensor<int32, []> var_1071_groups_0 = const()[name = tensor<string, []>("op_1071_groups_0"), val = tensor<int32, []>(1)];
771 tensor<fp16, [1280, 1280, 1, 1]> layers_3_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [204800]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(187698304))), name = tensor<string, []>("layers_3_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [7342]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(187683520))), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
772 tensor<fp16, [1, 1280, 1, 1]> var_1071_cast_fp16 = conv(dilations = var_1071_dilations_0, groups = var_1071_groups_0, pad = var_1071_pad_0, pad_type = var_1071_pad_type_0, strides = var_1071_strides_0, weight = layers_3_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified, x = obj_43_cast_fp16)[name = tensor<string, []>("op_1071_cast_fp16")];
773 tensor<fp16, [1, 1280, 1, 1]> current_value_cast_fp16 = add(x = var_1065_cast_fp16, y = var_1071_cast_fp16)[name = tensor<string, []>("current_value_cast_fp16")];
774 tensor<fp16, [1, 1280, 1, 224]> var_1077_cast_fp16 = mul(x = current_key_cast_fp16, y = var_159_cast_fp16)[name = tensor<string, []>("op_1077_cast_fp16")];
775 tensor<fp16, [1, 1280, 1, 224]> var_1079_cast_fp16 = mul(x = var_53_cast_fp16_3, y = var_162_cast_fp16)[name = tensor<string, []>("op_1079_cast_fp16")];
776 tensor<fp16, [1, 1280, 1, 224]> key_13_cast_fp16 = add(x = var_1077_cast_fp16, y = var_1079_cast_fp16)[name = tensor<string, []>("key_13_cast_fp16")];
777 tensor<fp16, [1, 1280, 1, 224]> var_1081_cast_fp16 = mul(x = current_value_cast_fp16, y = var_159_cast_fp16)[name = tensor<string, []>("op_1081_cast_fp16")];
778 tensor<fp16, [1, 1280, 1, 224]> var_1083_cast_fp16 = mul(x = var_60_cast_fp16_3, y = var_162_cast_fp16)[name = tensor<string, []>("op_1083_cast_fp16")];
779 tensor<fp16, [1, 1280, 1, 224]> value_13_cast_fp16 = add(x = var_1081_cast_fp16, y = var_1083_cast_fp16)[name = tensor<string, []>("value_13_cast_fp16")];
780 tensor<int32, [4]> var_1086 = const()[name = tensor<string, []>("op_1086"), val = tensor<int32, [4]>([1, 20, 64, -1])];
781 tensor<fp16, [1, 20, 64, 1]> mh_q_13_cast_fp16 = reshape(shape = var_1086, x = query_13_cast_fp16)[name = tensor<string, []>("mh_q_13_cast_fp16")];
782 tensor<fp16, []> var_1088_to_fp16 = const()[name = tensor<string, []>("op_1088_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
783 tensor<fp16, [1, 20, 64, 1]> var_1089_cast_fp16 = mul(x = mh_q_13_cast_fp16, y = var_1088_to_fp16)[name = tensor<string, []>("op_1089_cast_fp16")];
784 tensor<int32, [4]> var_1090 = const()[name = tensor<string, []>("op_1090"), val = tensor<int32, [4]>([1, 20, 64, -1])];
785 tensor<fp16, [1, 20, 64, 224]> var_1091_cast_fp16 = reshape(shape = var_1090, x = key_13_cast_fp16)[name = tensor<string, []>("op_1091_cast_fp16")];
786 tensor<bool, []> mh_w_19_transpose_x_0 = const()[name = tensor<string, []>("mh_w_19_transpose_x_0"), val = tensor<bool, []>(true)];
787 tensor<bool, []> mh_w_19_transpose_y_0 = const()[name = tensor<string, []>("mh_w_19_transpose_y_0"), val = tensor<bool, []>(false)];
788 tensor<fp16, [1, 20, 1, 224]> mh_w_19_cast_fp16 = matmul(transpose_x = mh_w_19_transpose_x_0, transpose_y = mh_w_19_transpose_y_0, x = var_1089_cast_fp16, y = var_1091_cast_fp16)[name = tensor<string, []>("mh_w_19_cast_fp16")];
789 tensor<fp16, [1, 20, 1, 224]> mh_w_21_cast_fp16 = add(x = mh_w_19_cast_fp16, y = var_180_cast_fp16)[name = tensor<string, []>("mh_w_21_cast_fp16")];
790 tensor<fp16, [1, 20, 1, 224]> var_1099_cast_fp16 = softmax(axis = var_986, x = mh_w_21_cast_fp16)[name = tensor<string, []>("op_1099_cast_fp16")];
791 tensor<int32, [4]> var_1100 = const()[name = tensor<string, []>("op_1100"), val = tensor<int32, [4]>([1, 20, 64, -1])];
792 tensor<fp16, [1, 20, 64, 224]> var_1101_cast_fp16 = reshape(shape = var_1100, x = value_13_cast_fp16)[name = tensor<string, []>("op_1101_cast_fp16")];
793 tensor<bool, []> attn_13_transpose_x_0 = const()[name = tensor<string, []>("attn_13_transpose_x_0"), val = tensor<bool, []>(false)];
794 tensor<bool, []> attn_13_transpose_y_0 = const()[name = tensor<string, []>("attn_13_transpose_y_0"), val = tensor<bool, []>(true)];
795 tensor<fp16, [1, 20, 64, 1]> attn_13_cast_fp16 = matmul(transpose_x = attn_13_transpose_x_0, transpose_y = attn_13_transpose_y_0, x = var_1101_cast_fp16, y = var_1099_cast_fp16)[name = tensor<string, []>("attn_13_cast_fp16")];
796 tensor<int32, [4]> var_1104 = const()[name = tensor<string, []>("op_1104"), val = tensor<int32, [4]>([1, 1280, 1, -1])];
797 tensor<fp16, [1, 1280, 1, 1]> input_31_cast_fp16 = reshape(shape = var_1104, x = attn_13_cast_fp16)[name = tensor<string, []>("input_31_cast_fp16")];
798 tensor<string, []> var_1114_pad_type_0 = const()[name = tensor<string, []>("op_1114_pad_type_0"), val = tensor<string, []>("valid")];
799 tensor<int32, [2]> var_1114_strides_0 = const()[name = tensor<string, []>("op_1114_strides_0"), val = tensor<int32, [2]>([1, 1])];
800 tensor<int32, [4]> var_1114_pad_0 = const()[name = tensor<string, []>("op_1114_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
801 tensor<int32, [2]> var_1114_dilations_0 = const()[name = tensor<string, []>("op_1114_dilations_0"), val = tensor<int32, [2]>([1, 1])];
802 tensor<int32, []> var_1114_groups_0 = const()[name = tensor<string, []>("op_1114_groups_0"), val = tensor<int32, []>(1)];
803 tensor<fp16, [1280, 1280, 1, 1]> layers_3_self_attn_o_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [819200]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(187903168))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(188722432))), name = tensor<string, []>("layers_3_self_attn_o_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
804 tensor<fp16, [1280]> layers_3_self_attn_o_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_3_self_attn_o_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(188722560)))];
805 tensor<fp16, [1, 1280, 1, 1]> var_1114_cast_fp16 = conv(bias = layers_3_self_attn_o_proj_inlier_module_bias_to_fp16, dilations = var_1114_dilations_0, groups = var_1114_groups_0, pad = var_1114_pad_0, pad_type = var_1114_pad_type_0, strides = var_1114_strides_0, weight = layers_3_self_attn_o_proj_inlier_module_weight_to_fp16_palettized, x = input_31_cast_fp16)[name = tensor<string, []>("op_1114_cast_fp16")];
806 tensor<string, []> var_1120_pad_type_0 = const()[name = tensor<string, []>("op_1120_pad_type_0"), val = tensor<string, []>("valid")];
807 tensor<int32, [2]> var_1120_strides_0 = const()[name = tensor<string, []>("op_1120_strides_0"), val = tensor<int32, [2]>([1, 1])];
808 tensor<int32, [4]> var_1120_pad_0 = const()[name = tensor<string, []>("op_1120_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
809 tensor<int32, [2]> var_1120_dilations_0 = const()[name = tensor<string, []>("op_1120_dilations_0"), val = tensor<int32, [2]>([1, 1])];
810 tensor<int32, []> var_1120_groups_0 = const()[name = tensor<string, []>("op_1120_groups_0"), val = tensor<int32, []>(1)];
811 tensor<fp16, [1280, 1280, 1, 1]> layers_3_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [204800]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(188739712))), name = tensor<string, []>("layers_3_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [7219]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(188725184))), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
812 tensor<fp16, [1, 1280, 1, 1]> var_1120_cast_fp16 = conv(dilations = var_1120_dilations_0, groups = var_1120_groups_0, pad = var_1120_pad_0, pad_type = var_1120_pad_type_0, strides = var_1120_strides_0, weight = layers_3_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified, x = input_31_cast_fp16)[name = tensor<string, []>("op_1120_cast_fp16")];
813 tensor<fp16, [1, 1280, 1, 1]> obj_49_cast_fp16 = add(x = var_1114_cast_fp16, y = var_1120_cast_fp16)[name = tensor<string, []>("obj_49_cast_fp16")];
814 tensor<fp16, [1, 1280, 1, 1]> inputs_21_cast_fp16 = add(x = inputs_19_cast_fp16, y = obj_49_cast_fp16)[name = tensor<string, []>("inputs_21_cast_fp16")];
815 tensor<int32, [1]> out_21_axes_0 = const()[name = tensor<string, []>("out_21_axes_0"), val = tensor<int32, [1]>([1])];
816 tensor<fp16, []> var_1135_to_fp16 = const()[name = tensor<string, []>("op_1135_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
817 tensor<fp16, [1, 1280, 1, 1]> out_21_cast_fp16 = layer_norm(axes = out_21_axes_0, epsilon = var_1135_to_fp16, x = inputs_21_cast_fp16)[name = tensor<string, []>("out_21_cast_fp16")];
818 tensor<fp16, [1280]> obj_51_gamma_0_to_fp16 = const()[name = tensor<string, []>("obj_51_gamma_0_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(188944576)))];
819 tensor<fp16, [1280]> obj_51_beta_0_to_fp16 = const()[name = tensor<string, []>("obj_51_beta_0_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(188947200)))];
820 tensor<fp16, []> obj_51_epsilon_0_to_fp16 = const()[name = tensor<string, []>("obj_51_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
821 tensor<fp16, [1, 1280, 1, 1]> obj_51_cast_fp16 = batch_norm(beta = obj_51_beta_0_to_fp16, epsilon = obj_51_epsilon_0_to_fp16, gamma = obj_51_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_21_cast_fp16)[name = tensor<string, []>("obj_51_cast_fp16")];
822 tensor<string, []> var_1157_pad_type_0 = const()[name = tensor<string, []>("op_1157_pad_type_0"), val = tensor<string, []>("valid")];
823 tensor<int32, [2]> var_1157_strides_0 = const()[name = tensor<string, []>("op_1157_strides_0"), val = tensor<int32, [2]>([1, 1])];
824 tensor<int32, [4]> var_1157_pad_0 = const()[name = tensor<string, []>("op_1157_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
825 tensor<int32, [2]> var_1157_dilations_0 = const()[name = tensor<string, []>("op_1157_dilations_0"), val = tensor<int32, [2]>([1, 1])];
826 tensor<int32, []> var_1157_groups_0 = const()[name = tensor<string, []>("op_1157_groups_0"), val = tensor<int32, []>(1)];
827 tensor<fp16, [1280, 1280, 1, 1]> layers_3_encoder_attn_q_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [819200]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(188949824))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(189769088))), name = tensor<string, []>("layers_3_encoder_attn_q_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
828 tensor<fp16, [1280]> layers_3_encoder_attn_q_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_3_encoder_attn_q_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(189769216)))];
829 tensor<fp16, [1, 1280, 1, 1]> var_1157_cast_fp16 = conv(bias = layers_3_encoder_attn_q_proj_inlier_module_bias_to_fp16, dilations = var_1157_dilations_0, groups = var_1157_groups_0, pad = var_1157_pad_0, pad_type = var_1157_pad_type_0, strides = var_1157_strides_0, weight = layers_3_encoder_attn_q_proj_inlier_module_weight_to_fp16_palettized, x = obj_51_cast_fp16)[name = tensor<string, []>("op_1157_cast_fp16")];
830 tensor<string, []> var_1163_pad_type_0 = const()[name = tensor<string, []>("op_1163_pad_type_0"), val = tensor<string, []>("valid")];
831 tensor<int32, [2]> var_1163_strides_0 = const()[name = tensor<string, []>("op_1163_strides_0"), val = tensor<int32, [2]>([1, 1])];
832 tensor<int32, [4]> var_1163_pad_0 = const()[name = tensor<string, []>("op_1163_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
833 tensor<int32, [2]> var_1163_dilations_0 = const()[name = tensor<string, []>("op_1163_dilations_0"), val = tensor<int32, [2]>([1, 1])];
834 tensor<int32, []> var_1163_groups_0 = const()[name = tensor<string, []>("op_1163_groups_0"), val = tensor<int32, []>(1)];
835 tensor<fp16, [1280, 1280, 1, 1]> layers_3_encoder_attn_q_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [204800]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(189787264))), name = tensor<string, []>("layers_3_encoder_attn_q_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [7675]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(189771840))), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
836 tensor<fp16, [1, 1280, 1, 1]> var_1163_cast_fp16 = conv(dilations = var_1163_dilations_0, groups = var_1163_groups_0, pad = var_1163_pad_0, pad_type = var_1163_pad_type_0, strides = var_1163_strides_0, weight = layers_3_encoder_attn_q_proj_outlier_module_weight_to_fp16_sparsified, x = obj_51_cast_fp16)[name = tensor<string, []>("op_1163_cast_fp16")];
837 tensor<fp16, [1, 1280, 1, 1]> query_cast_fp16 = add(x = var_1157_cast_fp16, y = var_1163_cast_fp16)[name = tensor<string, []>("query_cast_fp16")];
838 tensor<string, []> var_1172_pad_type_0 = const()[name = tensor<string, []>("op_1172_pad_type_0"), val = tensor<string, []>("valid")];
839 tensor<int32, [2]> var_1172_strides_0 = const()[name = tensor<string, []>("op_1172_strides_0"), val = tensor<int32, [2]>([1, 1])];
840 tensor<int32, [4]> var_1172_pad_0 = const()[name = tensor<string, []>("op_1172_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
841 tensor<int32, [2]> var_1172_dilations_0 = const()[name = tensor<string, []>("op_1172_dilations_0"), val = tensor<int32, [2]>([1, 1])];
842 tensor<int32, []> var_1172_groups_0 = const()[name = tensor<string, []>("op_1172_groups_0"), val = tensor<int32, []>(1)];
843 tensor<fp16, [1280, 1280, 1, 1]> layers_3_encoder_attn_k_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [819200]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(189992128))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(190811392))), name = tensor<string, []>("layers_3_encoder_attn_k_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
844 tensor<fp16, [1, 1280, 1, 1500]> var_1172_cast_fp16 = conv(dilations = var_1172_dilations_0, groups = var_1172_groups_0, pad = var_1172_pad_0, pad_type = var_1172_pad_type_0, strides = var_1172_strides_0, weight = layers_3_encoder_attn_k_proj_inlier_module_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor<string, []>("op_1172_cast_fp16")];
845 tensor<string, []> var_1178_pad_type_0 = const()[name = tensor<string, []>("op_1178_pad_type_0"), val = tensor<string, []>("valid")];
846 tensor<int32, [2]> var_1178_strides_0 = const()[name = tensor<string, []>("op_1178_strides_0"), val = tensor<int32, [2]>([1, 1])];
847 tensor<int32, [4]> var_1178_pad_0 = const()[name = tensor<string, []>("op_1178_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
848 tensor<int32, [2]> var_1178_dilations_0 = const()[name = tensor<string, []>("op_1178_dilations_0"), val = tensor<int32, [2]>([1, 1])];
849 tensor<int32, []> var_1178_groups_0 = const()[name = tensor<string, []>("op_1178_groups_0"), val = tensor<int32, []>(1)];
850 tensor<fp16, [1280, 1280, 1, 1]> layers_3_encoder_attn_k_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [204800]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(190834240))), name = tensor<string, []>("layers_3_encoder_attn_k_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [11308]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(190811520))), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
851 tensor<fp16, [1, 1280, 1, 1500]> var_1178_cast_fp16 = conv(dilations = var_1178_dilations_0, groups = var_1178_groups_0, pad = var_1178_pad_0, pad_type = var_1178_pad_type_0, strides = var_1178_strides_0, weight = layers_3_encoder_attn_k_proj_outlier_module_weight_to_fp16_sparsified, x = encoder_output_embeds)[name = tensor<string, []>("op_1178_cast_fp16")];
852 tensor<fp16, [1, 1280, 1, 1500]> key_cast_fp16 = add(x = var_1172_cast_fp16, y = var_1178_cast_fp16)[name = tensor<string, []>("key_cast_fp16")];
853 tensor<string, []> var_1188_pad_type_0 = const()[name = tensor<string, []>("op_1188_pad_type_0"), val = tensor<string, []>("valid")];
854 tensor<int32, [2]> var_1188_strides_0 = const()[name = tensor<string, []>("op_1188_strides_0"), val = tensor<int32, [2]>([1, 1])];
855 tensor<int32, [4]> var_1188_pad_0 = const()[name = tensor<string, []>("op_1188_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
856 tensor<int32, [2]> var_1188_dilations_0 = const()[name = tensor<string, []>("op_1188_dilations_0"), val = tensor<int32, [2]>([1, 1])];
857 tensor<int32, []> var_1188_groups_0 = const()[name = tensor<string, []>("op_1188_groups_0"), val = tensor<int32, []>(1)];
858 tensor<fp16, [1280, 1280, 1, 1]> layers_3_encoder_attn_v_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [819200]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(191039104))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(191858368))), name = tensor<string, []>("layers_3_encoder_attn_v_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
859 tensor<fp16, [1280]> layers_3_encoder_attn_v_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_3_encoder_attn_v_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(191858496)))];
860 tensor<fp16, [1, 1280, 1, 1500]> var_1188_cast_fp16 = conv(bias = layers_3_encoder_attn_v_proj_inlier_module_bias_to_fp16, dilations = var_1188_dilations_0, groups = var_1188_groups_0, pad = var_1188_pad_0, pad_type = var_1188_pad_type_0, strides = var_1188_strides_0, weight = layers_3_encoder_attn_v_proj_inlier_module_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor<string, []>("op_1188_cast_fp16")];
861 tensor<string, []> var_1194_pad_type_0 = const()[name = tensor<string, []>("op_1194_pad_type_0"), val = tensor<string, []>("valid")];
862 tensor<int32, [2]> var_1194_strides_0 = const()[name = tensor<string, []>("op_1194_strides_0"), val = tensor<int32, [2]>([1, 1])];
863 tensor<int32, [4]> var_1194_pad_0 = const()[name = tensor<string, []>("op_1194_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
864 tensor<int32, [2]> var_1194_dilations_0 = const()[name = tensor<string, []>("op_1194_dilations_0"), val = tensor<int32, [2]>([1, 1])];
865 tensor<int32, []> var_1194_groups_0 = const()[name = tensor<string, []>("op_1194_groups_0"), val = tensor<int32, []>(1)];
866 tensor<fp16, [1280, 1280, 1, 1]> layers_3_encoder_attn_v_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [204800]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(191874944))), name = tensor<string, []>("layers_3_encoder_attn_v_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [6870]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(191861120))), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
867 tensor<fp16, [1, 1280, 1, 1500]> var_1194_cast_fp16 = conv(dilations = var_1194_dilations_0, groups = var_1194_groups_0, pad = var_1194_pad_0, pad_type = var_1194_pad_type_0, strides = var_1194_strides_0, weight = layers_3_encoder_attn_v_proj_outlier_module_weight_to_fp16_sparsified, x = encoder_output_embeds)[name = tensor<string, []>("op_1194_cast_fp16")];
868 tensor<fp16, [1, 1280, 1, 1500]> value_cast_fp16 = add(x = var_1188_cast_fp16, y = var_1194_cast_fp16)[name = tensor<string, []>("value_cast_fp16")];
869 tensor<int32, [4]> var_1197 = const()[name = tensor<string, []>("op_1197"), val = tensor<int32, [4]>([1, 20, 64, -1])];
870 tensor<fp16, [1, 20, 64, 1]> mh_q_cast_fp16 = reshape(shape = var_1197, x = query_cast_fp16)[name = tensor<string, []>("mh_q_cast_fp16")];
871 tensor<fp16, []> var_1199_to_fp16 = const()[name = tensor<string, []>("op_1199_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
872 tensor<fp16, [1, 20, 64, 1]> var_1200_cast_fp16 = mul(x = mh_q_cast_fp16, y = var_1199_to_fp16)[name = tensor<string, []>("op_1200_cast_fp16")];
873 tensor<int32, [4]> var_1201 = const()[name = tensor<string, []>("op_1201"), val = tensor<int32, [4]>([1, 20, 64, -1])];
874 tensor<fp16, [1, 20, 64, 1500]> var_1202_cast_fp16 = reshape(shape = var_1201, x = key_cast_fp16)[name = tensor<string, []>("op_1202_cast_fp16")];
875 tensor<bool, []> mh_w_transpose_x_0 = const()[name = tensor<string, []>("mh_w_transpose_x_0"), val = tensor<bool, []>(true)];
876 tensor<bool, []> mh_w_transpose_y_0 = const()[name = tensor<string, []>("mh_w_transpose_y_0"), val = tensor<bool, []>(false)];
877 tensor<fp16, [1, 20, 1, 1500]> mh_w_cast_fp16 = matmul(transpose_x = mh_w_transpose_x_0, transpose_y = mh_w_transpose_y_0, x = var_1200_cast_fp16, y = var_1202_cast_fp16)[name = tensor<string, []>("mh_w_cast_fp16")];
878 tensor<fp16, [1, 20, 1, 1500]> obj_55_cast_fp16 = softmax(axis = var_986, x = mh_w_cast_fp16)[name = tensor<string, []>("obj_55_cast_fp16")];
879 tensor<int32, [4]> var_1206 = const()[name = tensor<string, []>("op_1206"), val = tensor<int32, [4]>([1, 20, 64, -1])];
880 tensor<fp16, [1, 20, 64, 1500]> var_1207_cast_fp16 = reshape(shape = var_1206, x = value_cast_fp16)[name = tensor<string, []>("op_1207_cast_fp16")];
881 tensor<bool, []> attn_transpose_x_0 = const()[name = tensor<string, []>("attn_transpose_x_0"), val = tensor<bool, []>(false)];
882 tensor<bool, []> attn_transpose_y_0 = const()[name = tensor<string, []>("attn_transpose_y_0"), val = tensor<bool, []>(true)];
883 tensor<fp16, [1, 20, 64, 1]> attn_cast_fp16 = matmul(transpose_x = attn_transpose_x_0, transpose_y = attn_transpose_y_0, x = var_1207_cast_fp16, y = obj_55_cast_fp16)[name = tensor<string, []>("attn_cast_fp16")];
884 tensor<int32, [4]> var_1210 = const()[name = tensor<string, []>("op_1210"), val = tensor<int32, [4]>([1, 1280, 1, -1])];
885 tensor<fp16, [1, 1280, 1, 1]> input_33_cast_fp16 = reshape(shape = var_1210, x = attn_cast_fp16)[name = tensor<string, []>("input_33_cast_fp16")];
886 tensor<string, []> var_1220_pad_type_0 = const()[name = tensor<string, []>("op_1220_pad_type_0"), val = tensor<string, []>("valid")];
887 tensor<int32, [2]> var_1220_strides_0 = const()[name = tensor<string, []>("op_1220_strides_0"), val = tensor<int32, [2]>([1, 1])];
888 tensor<int32, [4]> var_1220_pad_0 = const()[name = tensor<string, []>("op_1220_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
889 tensor<int32, [2]> var_1220_dilations_0 = const()[name = tensor<string, []>("op_1220_dilations_0"), val = tensor<int32, [2]>([1, 1])];
890 tensor<int32, []> var_1220_groups_0 = const()[name = tensor<string, []>("op_1220_groups_0"), val = tensor<int32, []>(1)];
891 tensor<fp16, [1280, 1280, 1, 1]> layers_3_encoder_attn_o_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [819200]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(192079808))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(192899072))), name = tensor<string, []>("layers_3_encoder_attn_o_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
892 tensor<fp16, [1280]> layers_3_encoder_attn_o_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_3_encoder_attn_o_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(192899200)))];
893 tensor<fp16, [1, 1280, 1, 1]> var_1220_cast_fp16 = conv(bias = layers_3_encoder_attn_o_proj_inlier_module_bias_to_fp16, dilations = var_1220_dilations_0, groups = var_1220_groups_0, pad = var_1220_pad_0, pad_type = var_1220_pad_type_0, strides = var_1220_strides_0, weight = layers_3_encoder_attn_o_proj_inlier_module_weight_to_fp16_palettized, x = input_33_cast_fp16)[name = tensor<string, []>("op_1220_cast_fp16")];
894 tensor<string, []> var_1226_pad_type_0 = const()[name = tensor<string, []>("op_1226_pad_type_0"), val = tensor<string, []>("valid")];
895 tensor<int32, [2]> var_1226_strides_0 = const()[name = tensor<string, []>("op_1226_strides_0"), val = tensor<int32, [2]>([1, 1])];
896 tensor<int32, [4]> var_1226_pad_0 = const()[name = tensor<string, []>("op_1226_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
897 tensor<int32, [2]> var_1226_dilations_0 = const()[name = tensor<string, []>("op_1226_dilations_0"), val = tensor<int32, [2]>([1, 1])];
898 tensor<int32, []> var_1226_groups_0 = const()[name = tensor<string, []>("op_1226_groups_0"), val = tensor<int32, []>(1)];
899 tensor<fp16, [1280, 1280, 1, 1]> layers_3_encoder_attn_o_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [204800]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(192913536))), name = tensor<string, []>("layers_3_encoder_attn_o_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [5809]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(192901824))), shape = tensor<uint32, [4]>([1280, 1280, 1, 1])];
900 tensor<fp16, [1, 1280, 1, 1]> var_1226_cast_fp16 = conv(dilations = var_1226_dilations_0, groups = var_1226_groups_0, pad = var_1226_pad_0, pad_type = var_1226_pad_type_0, strides = var_1226_strides_0, weight = layers_3_encoder_attn_o_proj_outlier_module_weight_to_fp16_sparsified, x = input_33_cast_fp16)[name = tensor<string, []>("op_1226_cast_fp16")];
901 tensor<fp16, [1, 1280, 1, 1]> obj_53_cast_fp16 = add(x = var_1220_cast_fp16, y = var_1226_cast_fp16)[name = tensor<string, []>("obj_53_cast_fp16")];
902 tensor<fp16, [1, 1280, 1, 1]> inputs_23_cast_fp16 = add(x = inputs_21_cast_fp16, y = obj_53_cast_fp16)[name = tensor<string, []>("inputs_23_cast_fp16")];
903 tensor<int32, [1]> out_23_axes_0 = const()[name = tensor<string, []>("out_23_axes_0"), val = tensor<int32, [1]>([1])];
904 tensor<fp16, []> var_1240_to_fp16 = const()[name = tensor<string, []>("op_1240_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
905 tensor<fp16, [1, 1280, 1, 1]> out_23_cast_fp16 = layer_norm(axes = out_23_axes_0, epsilon = var_1240_to_fp16, x = inputs_23_cast_fp16)[name = tensor<string, []>("out_23_cast_fp16")];
906 tensor<fp16, [1280]> input_35_gamma_0_to_fp16 = const()[name = tensor<string, []>("input_35_gamma_0_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(193118400)))];
907 tensor<fp16, [1280]> input_35_beta_0_to_fp16 = const()[name = tensor<string, []>("input_35_beta_0_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(193121024)))];
908 tensor<fp16, []> input_35_epsilon_0_to_fp16 = const()[name = tensor<string, []>("input_35_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
909 tensor<fp16, [1, 1280, 1, 1]> input_35_cast_fp16 = batch_norm(beta = input_35_beta_0_to_fp16, epsilon = input_35_epsilon_0_to_fp16, gamma = input_35_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_23_cast_fp16)[name = tensor<string, []>("input_35_cast_fp16")];
910 tensor<string, []> var_1258_pad_type_0 = const()[name = tensor<string, []>("op_1258_pad_type_0"), val = tensor<string, []>("valid")];
911 tensor<int32, [2]> var_1258_strides_0 = const()[name = tensor<string, []>("op_1258_strides_0"), val = tensor<int32, [2]>([1, 1])];
912 tensor<int32, [4]> var_1258_pad_0 = const()[name = tensor<string, []>("op_1258_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
913 tensor<int32, [2]> var_1258_dilations_0 = const()[name = tensor<string, []>("op_1258_dilations_0"), val = tensor<int32, [2]>([1, 1])];
914 tensor<int32, []> var_1258_groups_0 = const()[name = tensor<string, []>("op_1258_groups_0"), val = tensor<int32, []>(1)];
915 tensor<fp16, [5120, 1280, 1, 1]> layers_3_fc1_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [3276800]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(193123648))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(196400512))), name = tensor<string, []>("layers_3_fc1_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([5120, 1280, 1, 1])];
916 tensor<fp16, [5120]> layers_3_fc1_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_3_fc1_inlier_module_bias_to_fp16"), val = tensor<fp16, [5120]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(196400640)))];
917 tensor<fp16, [1, 5120, 1, 1]> var_1258_cast_fp16 = conv(bias = layers_3_fc1_inlier_module_bias_to_fp16, dilations = var_1258_dilations_0, groups = var_1258_groups_0, pad = var_1258_pad_0, pad_type = var_1258_pad_type_0, strides = var_1258_strides_0, weight = layers_3_fc1_inlier_module_weight_to_fp16_palettized, x = input_35_cast_fp16)[name = tensor<string, []>("op_1258_cast_fp16")];
918 tensor<string, []> var_1264_pad_type_0 = const()[name = tensor<string, []>("op_1264_pad_type_0"), val = tensor<string, []>("valid")];
919 tensor<int32, [2]> var_1264_strides_0 = const()[name = tensor<string, []>("op_1264_strides_0"), val = tensor<int32, [2]>([1, 1])];
920 tensor<int32, [4]> var_1264_pad_0 = const()[name = tensor<string, []>("op_1264_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
921 tensor<int32, [2]> var_1264_dilations_0 = const()[name = tensor<string, []>("op_1264_dilations_0"), val = tensor<int32, [2]>([1, 1])];
922 tensor<int32, []> var_1264_groups_0 = const()[name = tensor<string, []>("op_1264_groups_0"), val = tensor<int32, []>(1)];
923 tensor<fp16, [5120, 1280, 1, 1]> layers_3_fc1_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [819200]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(196463680))), name = tensor<string, []>("layers_3_fc1_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [26331]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(196410944))), shape = tensor<uint32, [4]>([5120, 1280, 1, 1])];
924 tensor<fp16, [1, 5120, 1, 1]> var_1264_cast_fp16 = conv(dilations = var_1264_dilations_0, groups = var_1264_groups_0, pad = var_1264_pad_0, pad_type = var_1264_pad_type_0, strides = var_1264_strides_0, weight = layers_3_fc1_outlier_module_weight_to_fp16_sparsified, x = input_35_cast_fp16)[name = tensor<string, []>("op_1264_cast_fp16")];
925 tensor<fp16, [1, 5120, 1, 1]> input_37_cast_fp16 = add(x = var_1258_cast_fp16, y = var_1264_cast_fp16)[name = tensor<string, []>("input_37_cast_fp16")];
926 tensor<string, []> input_mode_0 = const()[name = tensor<string, []>("input_mode_0"), val = tensor<string, []>("EXACT")];
927 tensor<fp16, [1, 5120, 1, 1]> input_cast_fp16 = gelu(mode = input_mode_0, x = input_37_cast_fp16)[name = tensor<string, []>("input_cast_fp16")];
928 tensor<string, []> var_1275_pad_type_0 = const()[name = tensor<string, []>("op_1275_pad_type_0"), val = tensor<string, []>("valid")];
929 tensor<int32, [2]> var_1275_strides_0 = const()[name = tensor<string, []>("op_1275_strides_0"), val = tensor<int32, [2]>([1, 1])];
930 tensor<int32, [4]> var_1275_pad_0 = const()[name = tensor<string, []>("op_1275_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
931 tensor<int32, [2]> var_1275_dilations_0 = const()[name = tensor<string, []>("op_1275_dilations_0"), val = tensor<int32, [2]>([1, 1])];
932 tensor<int32, []> var_1275_groups_0 = const()[name = tensor<string, []>("op_1275_groups_0"), val = tensor<int32, []>(1)];
933 tensor<fp16, [1280, 5120, 1, 1]> layers_3_fc2_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [4915200]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(197282944))), lut = tensor<fp16, [64]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(202198208))), name = tensor<string, []>("layers_3_fc2_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([1280, 5120, 1, 1])];
934 tensor<fp16, [1280]> layers_3_fc2_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_3_fc2_inlier_module_bias_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(202198400)))];
935 tensor<fp16, [1, 1280, 1, 1]> var_1275_cast_fp16 = conv(bias = layers_3_fc2_inlier_module_bias_to_fp16, dilations = var_1275_dilations_0, groups = var_1275_groups_0, pad = var_1275_pad_0, pad_type = var_1275_pad_type_0, strides = var_1275_strides_0, weight = layers_3_fc2_inlier_module_weight_to_fp16_palettized, x = input_cast_fp16)[name = tensor<string, []>("op_1275_cast_fp16")];
936 tensor<string, []> var_1281_pad_type_0 = const()[name = tensor<string, []>("op_1281_pad_type_0"), val = tensor<string, []>("valid")];
937 tensor<int32, [2]> var_1281_strides_0 = const()[name = tensor<string, []>("op_1281_strides_0"), val = tensor<int32, [2]>([1, 1])];
938 tensor<int32, [4]> var_1281_pad_0 = const()[name = tensor<string, []>("op_1281_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
939 tensor<int32, [2]> var_1281_dilations_0 = const()[name = tensor<string, []>("op_1281_dilations_0"), val = tensor<int32, [2]>([1, 1])];
940 tensor<int32, []> var_1281_groups_0 = const()[name = tensor<string, []>("op_1281_groups_0"), val = tensor<int32, []>(1)];
941 tensor<fp16, [1280, 5120, 1, 1]> layers_3_fc2_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [819200]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(202271552))), name = tensor<string, []>("layers_3_fc2_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [35232]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(202201024))), shape = tensor<uint32, [4]>([1280, 5120, 1, 1])];
942 tensor<fp16, [1, 1280, 1, 1]> var_1281_cast_fp16 = conv(dilations = var_1281_dilations_0, groups = var_1281_groups_0, pad = var_1281_pad_0, pad_type = var_1281_pad_type_0, strides = var_1281_strides_0, weight = layers_3_fc2_outlier_module_weight_to_fp16_sparsified, x = input_cast_fp16)[name = tensor<string, []>("op_1281_cast_fp16")];
943 tensor<fp16, [1, 1280, 1, 1]> hidden_states_9_cast_fp16 = add(x = var_1275_cast_fp16, y = var_1281_cast_fp16)[name = tensor<string, []>("hidden_states_9_cast_fp16")];
944 tensor<fp16, [1, 1280, 1, 1]> inputs_cast_fp16 = add(x = inputs_23_cast_fp16, y = hidden_states_9_cast_fp16)[name = tensor<string, []>("inputs_cast_fp16")];
945 tensor<int32, [1]> out_axes_0 = const()[name = tensor<string, []>("out_axes_0"), val = tensor<int32, [1]>([1])];
946 tensor<fp16, []> var_1301_to_fp16 = const()[name = tensor<string, []>("op_1301_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
947 tensor<fp16, [1, 1280, 1, 1]> out_cast_fp16 = layer_norm(axes = out_axes_0, epsilon = var_1301_to_fp16, x = inputs_cast_fp16)[name = tensor<string, []>("out_cast_fp16")];
948 tensor<fp16, [1280]> hidden_states_gamma_0_to_fp16 = const()[name = tensor<string, []>("hidden_states_gamma_0_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(203090816)))];
949 tensor<fp16, [1280]> hidden_states_beta_0_to_fp16 = const()[name = tensor<string, []>("hidden_states_beta_0_to_fp16"), val = tensor<fp16, [1280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(203093440)))];
950 tensor<fp16, []> hidden_states_epsilon_0_to_fp16 = const()[name = tensor<string, []>("hidden_states_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
951 tensor<fp16, [1, 1280, 1, 1]> hidden_states_cast_fp16 = batch_norm(beta = hidden_states_beta_0_to_fp16, epsilon = hidden_states_epsilon_0_to_fp16, gamma = hidden_states_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_cast_fp16)[name = tensor<string, []>("hidden_states_cast_fp16")];
952 tensor<int32, [1]> var_1312_axes_0 = const()[name = tensor<string, []>("op_1312_axes_0"), val = tensor<int32, [1]>([2])];
953 tensor<fp16, [1, 1280, 1]> var_1312_cast_fp16 = squeeze(axes = var_1312_axes_0, x = hidden_states_cast_fp16)[name = tensor<string, []>("op_1312_cast_fp16")];
954 tensor<int32, [3]> var_1315_perm_0 = const()[name = tensor<string, []>("op_1315_perm_0"), val = tensor<int32, [3]>([0, 2, 1])];
955 tensor<fp16, [51866]> linear_0_bias_0_to_fp16 = const()[name = tensor<string, []>("linear_0_bias_0_to_fp16"), val = tensor<fp16, [51866]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(203096064)))];
956 tensor<fp16, [1, 1, 1280]> var_1315_cast_fp16 = transpose(perm = var_1315_perm_0, x = var_1312_cast_fp16)[name = tensor<string, []>("transpose_0")];
957 tensor<fp16, [1, 1, 51866]> logits = linear(bias = linear_0_bias_0_to_fp16, weight = embed_tokens_weight_to_fp16, x = var_1315_cast_fp16)[name = tensor<string, []>("linear_0_cast_fp16")];
958 tensor<int32, []> var_1319 = const()[name = tensor<string, []>("op_1319"), val = tensor<int32, []>(1)];
959 tensor<bool, []> obj_59_interleave_0 = const()[name = tensor<string, []>("obj_59_interleave_0"), val = tensor<bool, []>(false)];
960 tensor<fp16, [1, 5120, 1, 1]> key_cache_updates = concat(axis = var_1319, interleave = obj_59_interleave_0, values = (current_key_1_cast_fp16, current_key_3_cast_fp16, current_key_5_cast_fp16, current_key_cast_fp16))[name = tensor<string, []>("obj_59_cast_fp16")];
961 tensor<int32, []> var_1322 = const()[name = tensor<string, []>("op_1322"), val = tensor<int32, []>(1)];
962 tensor<bool, []> obj_61_interleave_0 = const()[name = tensor<string, []>("obj_61_interleave_0"), val = tensor<bool, []>(false)];
963 tensor<fp16, [1, 5120, 1, 1]> value_cache_updates = concat(axis = var_1322, interleave = obj_61_interleave_0, values = (current_value_1_cast_fp16, current_value_3_cast_fp16, current_value_5_cast_fp16, current_value_cast_fp16))[name = tensor<string, []>("obj_61_cast_fp16")];
964 tensor<int32, [4]> var_1333_begin_0 = const()[name = tensor<string, []>("op_1333_begin_0"), val = tensor<int32, [4]>([0, 4, 0, 0])];
965 tensor<int32, [4]> var_1333_end_0 = const()[name = tensor<string, []>("op_1333_end_0"), val = tensor<int32, [4]>([1, 5, 1, 1500])];
966 tensor<bool, [4]> var_1333_end_mask_0 = const()[name = tensor<string, []>("op_1333_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
967 tensor<fp16, [1, 1, 1, 1500]> var_1333_cast_fp16 = slice_by_index(begin = var_1333_begin_0, end = var_1333_end_0, end_mask = var_1333_end_mask_0, x = obj_41_cast_fp16)[name = tensor<string, []>("op_1333_cast_fp16")];
968 tensor<int32, [4]> var_1336_begin_0 = const()[name = tensor<string, []>("op_1336_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
969 tensor<int32, [4]> var_1336_end_0 = const()[name = tensor<string, []>("op_1336_end_0"), val = tensor<int32, [4]>([1, 1, 1, 1500])];
970 tensor<bool, [4]> var_1336_end_mask_0 = const()[name = tensor<string, []>("op_1336_end_mask_0"), val = tensor<bool, [4]>([true, true, false, true])];
971 tensor<bool, [4]> var_1336_squeeze_mask_0 = const()[name = tensor<string, []>("op_1336_squeeze_mask_0"), val = tensor<bool, [4]>([false, false, true, false])];
972 tensor<fp16, [1, 1, 1500]> var_1336_cast_fp16 = slice_by_index(begin = var_1336_begin_0, end = var_1336_end_0, end_mask = var_1336_end_mask_0, squeeze_mask = var_1336_squeeze_mask_0, x = var_1333_cast_fp16)[name = tensor<string, []>("op_1336_cast_fp16")];
973 tensor<int32, [4]> var_1351_begin_0 = const()[name = tensor<string, []>("op_1351_begin_0"), val = tensor<int32, [4]>([0, 11, 0, 0])];
974 tensor<int32, [4]> var_1351_end_0 = const()[name = tensor<string, []>("op_1351_end_0"), val = tensor<int32, [4]>([1, 12, 1, 1500])];
975 tensor<bool, [4]> var_1351_end_mask_0 = const()[name = tensor<string, []>("op_1351_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
976 tensor<fp16, [1, 1, 1, 1500]> var_1351_cast_fp16 = slice_by_index(begin = var_1351_begin_0, end = var_1351_end_0, end_mask = var_1351_end_mask_0, x = obj_41_cast_fp16)[name = tensor<string, []>("op_1351_cast_fp16")];
977 tensor<int32, [4]> var_1354_begin_0 = const()[name = tensor<string, []>("op_1354_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
978 tensor<int32, [4]> var_1354_end_0 = const()[name = tensor<string, []>("op_1354_end_0"), val = tensor<int32, [4]>([1, 1, 1, 1500])];
979 tensor<bool, [4]> var_1354_end_mask_0 = const()[name = tensor<string, []>("op_1354_end_mask_0"), val = tensor<bool, [4]>([true, true, false, true])];
980 tensor<bool, [4]> var_1354_squeeze_mask_0 = const()[name = tensor<string, []>("op_1354_squeeze_mask_0"), val = tensor<bool, [4]>([false, false, true, false])];
981 tensor<fp16, [1, 1, 1500]> var_1354_cast_fp16 = slice_by_index(begin = var_1354_begin_0, end = var_1354_end_0, end_mask = var_1354_end_mask_0, squeeze_mask = var_1354_squeeze_mask_0, x = var_1351_cast_fp16)[name = tensor<string, []>("op_1354_cast_fp16")];
982 tensor<int32, [4]> var_1369_begin_0 = const()[name = tensor<string, []>("op_1369_begin_0"), val = tensor<int32, [4]>([0, 3, 0, 0])];
983 tensor<int32, [4]> var_1369_end_0 = const()[name = tensor<string, []>("op_1369_end_0"), val = tensor<int32, [4]>([1, 4, 1, 1500])];
984 tensor<bool, [4]> var_1369_end_mask_0 = const()[name = tensor<string, []>("op_1369_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
985 tensor<fp16, [1, 1, 1, 1500]> var_1369_cast_fp16 = slice_by_index(begin = var_1369_begin_0, end = var_1369_end_0, end_mask = var_1369_end_mask_0, x = obj_55_cast_fp16)[name = tensor<string, []>("op_1369_cast_fp16")];
986 tensor<int32, [4]> var_1372_begin_0 = const()[name = tensor<string, []>("op_1372_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
987 tensor<int32, [4]> var_1372_end_0 = const()[name = tensor<string, []>("op_1372_end_0"), val = tensor<int32, [4]>([1, 1, 1, 1500])];
988 tensor<bool, [4]> var_1372_end_mask_0 = const()[name = tensor<string, []>("op_1372_end_mask_0"), val = tensor<bool, [4]>([true, true, false, true])];
989 tensor<bool, [4]> var_1372_squeeze_mask_0 = const()[name = tensor<string, []>("op_1372_squeeze_mask_0"), val = tensor<bool, [4]>([false, false, true, false])];
990 tensor<fp16, [1, 1, 1500]> var_1372_cast_fp16 = slice_by_index(begin = var_1372_begin_0, end = var_1372_end_0, end_mask = var_1372_end_mask_0, squeeze_mask = var_1372_squeeze_mask_0, x = var_1369_cast_fp16)[name = tensor<string, []>("op_1372_cast_fp16")];
991 tensor<int32, [4]> var_1387_begin_0 = const()[name = tensor<string, []>("op_1387_begin_0"), val = tensor<int32, [4]>([0, 6, 0, 0])];
992 tensor<int32, [4]> var_1387_end_0 = const()[name = tensor<string, []>("op_1387_end_0"), val = tensor<int32, [4]>([1, 7, 1, 1500])];
993 tensor<bool, [4]> var_1387_end_mask_0 = const()[name = tensor<string, []>("op_1387_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
994 tensor<fp16, [1, 1, 1, 1500]> var_1387_cast_fp16 = slice_by_index(begin = var_1387_begin_0, end = var_1387_end_0, end_mask = var_1387_end_mask_0, x = obj_55_cast_fp16)[name = tensor<string, []>("op_1387_cast_fp16")];
995 tensor<int32, [4]> var_1390_begin_0 = const()[name = tensor<string, []>("op_1390_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
996 tensor<int32, [4]> var_1390_end_0 = const()[name = tensor<string, []>("op_1390_end_0"), val = tensor<int32, [4]>([1, 1, 1, 1500])];
997 tensor<bool, [4]> var_1390_end_mask_0 = const()[name = tensor<string, []>("op_1390_end_mask_0"), val = tensor<bool, [4]>([true, true, false, true])];
998 tensor<bool, [4]> var_1390_squeeze_mask_0 = const()[name = tensor<string, []>("op_1390_squeeze_mask_0"), val = tensor<bool, [4]>([false, false, true, false])];
999 tensor<fp16, [1, 1, 1500]> var_1390_cast_fp16 = slice_by_index(begin = var_1390_begin_0, end = var_1390_end_0, end_mask = var_1390_end_mask_0, squeeze_mask = var_1390_squeeze_mask_0, x = var_1387_cast_fp16)[name = tensor<string, []>("op_1390_cast_fp16")];
1000 tensor<int32, [4]> var_1405_begin_0 = const()[name = tensor<string, []>("op_1405_begin_0"), val = tensor<int32, [4]>([0, 11, 0, 0])];
1001 tensor<int32, [4]> var_1405_end_0 = const()[name = tensor<string, []>("op_1405_end_0"), val = tensor<int32, [4]>([1, 12, 1, 1500])];
1002 tensor<bool, [4]> var_1405_end_mask_0 = const()[name = tensor<string, []>("op_1405_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
1003 tensor<fp16, [1, 1, 1, 1500]> var_1405_cast_fp16 = slice_by_index(begin = var_1405_begin_0, end = var_1405_end_0, end_mask = var_1405_end_mask_0, x = obj_55_cast_fp16)[name = tensor<string, []>("op_1405_cast_fp16")];
1004 tensor<int32, [4]> var_1408_begin_0 = const()[name = tensor<string, []>("op_1408_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
1005 tensor<int32, [4]> var_1408_end_0 = const()[name = tensor<string, []>("op_1408_end_0"), val = tensor<int32, [4]>([1, 1, 1, 1500])];
1006 tensor<bool, [4]> var_1408_end_mask_0 = const()[name = tensor<string, []>("op_1408_end_mask_0"), val = tensor<bool, [4]>([true, true, false, true])];
1007 tensor<bool, [4]> var_1408_squeeze_mask_0 = const()[name = tensor<string, []>("op_1408_squeeze_mask_0"), val = tensor<bool, [4]>([false, false, true, false])];
1008 tensor<fp16, [1, 1, 1500]> var_1408_cast_fp16 = slice_by_index(begin = var_1408_begin_0, end = var_1408_end_0, end_mask = var_1408_end_mask_0, squeeze_mask = var_1408_squeeze_mask_0, x = var_1405_cast_fp16)[name = tensor<string, []>("op_1408_cast_fp16")];
1009 tensor<int32, [4]> var_1423_begin_0 = const()[name = tensor<string, []>("op_1423_begin_0"), val = tensor<int32, [4]>([0, 14, 0, 0])];
1010 tensor<int32, [4]> var_1423_end_0 = const()[name = tensor<string, []>("op_1423_end_0"), val = tensor<int32, [4]>([1, 15, 1, 1500])];
1011 tensor<bool, [4]> var_1423_end_mask_0 = const()[name = tensor<string, []>("op_1423_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
1012 tensor<fp16, [1, 1, 1, 1500]> var_1423_cast_fp16 = slice_by_index(begin = var_1423_begin_0, end = var_1423_end_0, end_mask = var_1423_end_mask_0, x = obj_55_cast_fp16)[name = tensor<string, []>("op_1423_cast_fp16")];
1013 tensor<int32, [4]> var_1426_begin_0 = const()[name = tensor<string, []>("op_1426_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
1014 tensor<int32, [4]> var_1426_end_0 = const()[name = tensor<string, []>("op_1426_end_0"), val = tensor<int32, [4]>([1, 1, 1, 1500])];
1015 tensor<bool, [4]> var_1426_end_mask_0 = const()[name = tensor<string, []>("op_1426_end_mask_0"), val = tensor<bool, [4]>([true, true, false, true])];
1016 tensor<bool, [4]> var_1426_squeeze_mask_0 = const()[name = tensor<string, []>("op_1426_squeeze_mask_0"), val = tensor<bool, [4]>([false, false, true, false])];
1017 tensor<fp16, [1, 1, 1500]> var_1426_cast_fp16 = slice_by_index(begin = var_1426_begin_0, end = var_1426_end_0, end_mask = var_1426_end_mask_0, squeeze_mask = var_1426_squeeze_mask_0, x = var_1423_cast_fp16)[name = tensor<string, []>("op_1426_cast_fp16")];
1018 tensor<int32, []> var_1433 = const()[name = tensor<string, []>("op_1433"), val = tensor<int32, []>(1)];
1019 tensor<bool, []> var_1434_interleave_0 = const()[name = tensor<string, []>("op_1434_interleave_0"), val = tensor<bool, []>(false)];
1020 tensor<fp16, [1, 6, 1500]> var_1434_cast_fp16 = concat(axis = var_1433, interleave = var_1434_interleave_0, values = (var_1336_cast_fp16, var_1354_cast_fp16, var_1372_cast_fp16, var_1390_cast_fp16, var_1408_cast_fp16, var_1426_cast_fp16))[name = tensor<string, []>("op_1434_cast_fp16")];
1021 tensor<bool, []> var_1437 = const()[name = tensor<string, []>("op_1437"), val = tensor<bool, []>(false)];
1022 tensor<int32, [1]> obj_axes_0 = const()[name = tensor<string, []>("obj_axes_0"), val = tensor<int32, [1]>([1])];
1023 tensor<fp16, [1, 1500]> alignment_heads_weights = reduce_mean(axes = obj_axes_0, keep_dims = var_1437, x = var_1434_cast_fp16)[name = tensor<string, []>("obj_cast_fp16")];
1024 } -> (logits, key_cache_updates, value_cache_updates, alignment_heads_weights);
1025 }