openai_whisper-small.en_217MB/AudioEncoder.mlmodelc/model.mil

345.4 KB · 1625 lines · plaintext Raw

1	`program(1.0)`
2	`[buildInfo = dict<tensor<string, []>, tensor<string, []>>({{"coremlc-component-MIL", "3404.16.1"}, {"coremlc-version", "3404.23.1"}})]`
3	`{`
4	`func main<ios16>(tensor<fp16, [1, 80, 1, 3000]> melspectrogram_features) {`
5	`tensor<string, []> var_76_pad_type_0 = const()[name = tensor<string, []>("op_76_pad_type_0"), val = tensor<string, []>("custom")];`
6	`tensor<int32, [4]> var_76_pad_0 = const()[name = tensor<string, []>("op_76_pad_0"), val = tensor<int32, [4]>([0, 0, 1, 1])];`
7	`tensor<int32, [2]> var_76_strides_0 = const()[name = tensor<string, []>("op_76_strides_0"), val = tensor<int32, [2]>([1, 1])];`
8	`tensor<int32, [2]> var_76_dilations_0 = const()[name = tensor<string, []>("op_76_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
9	`tensor<int32, []> var_76_groups_0 = const()[name = tensor<string, []>("op_76_groups_0"), val = tensor<int32, []>(1)];`
10	`tensor<fp16, [768, 80, 1, 3]> var_45_to_fp16 = const()[name = tensor<string, []>("op_45_to_fp16"), val = tensor<fp16, [768, 80, 1, 3]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(64)))];`
11	`tensor<fp16, [768]> var_57_to_fp16 = const()[name = tensor<string, []>("op_57_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(368768)))];`
12	`tensor<fp16, [1, 768, 1, 3000]> var_76_cast_fp16 = conv(bias = var_57_to_fp16, dilations = var_76_dilations_0, groups = var_76_groups_0, pad = var_76_pad_0, pad_type = var_76_pad_type_0, strides = var_76_strides_0, weight = var_45_to_fp16, x = melspectrogram_features)[name = tensor<string, []>("op_76_cast_fp16")];`
13	`tensor<string, []> var_114_pad_type_0 = const()[name = tensor<string, []>("op_114_pad_type_0"), val = tensor<string, []>("custom")];`
14	`tensor<int32, [4]> var_114_pad_0 = const()[name = tensor<string, []>("op_114_pad_0"), val = tensor<int32, [4]>([0, 0, 1, 1])];`
15	`tensor<int32, [2]> var_114_strides_0 = const()[name = tensor<string, []>("op_114_strides_0"), val = tensor<int32, [2]>([1, 1])];`
16	`tensor<int32, [2]> var_114_dilations_0 = const()[name = tensor<string, []>("op_114_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
17	`tensor<int32, []> var_114_groups_0 = const()[name = tensor<string, []>("op_114_groups_0"), val = tensor<int32, []>(1)];`
18	`tensor<fp16, [768, 80, 1, 3]> op_89_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [92160]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(370368))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(462592))), name = tensor<string, []>("op_89_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 80, 1, 3])];`
19	`tensor<fp16, [768]> var_95_to_fp16 = const()[name = tensor<string, []>("op_95_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(462720)))];`
20	`tensor<fp16, [1, 768, 1, 3000]> var_114_cast_fp16 = conv(bias = var_95_to_fp16, dilations = var_114_dilations_0, groups = var_114_groups_0, pad = var_114_pad_0, pad_type = var_114_pad_type_0, strides = var_114_strides_0, weight = op_89_to_fp16_palettized, x = melspectrogram_features)[name = tensor<string, []>("op_114_cast_fp16")];`
21	`tensor<fp16, [1, 768, 1, 3000]> var_116_cast_fp16 = add(x = var_76_cast_fp16, y = var_114_cast_fp16)[name = tensor<string, []>("op_116_cast_fp16")];`
22	`tensor<string, []> hidden_states_1_mode_0 = const()[name = tensor<string, []>("hidden_states_1_mode_0"), val = tensor<string, []>("EXACT")];`
23	`tensor<fp16, [1, 768, 1, 3000]> hidden_states_1_cast_fp16 = gelu(mode = hidden_states_1_mode_0, x = var_116_cast_fp16)[name = tensor<string, []>("hidden_states_1_cast_fp16")];`
24	`tensor<string, []> var_162_pad_type_0 = const()[name = tensor<string, []>("op_162_pad_type_0"), val = tensor<string, []>("custom")];`
25	`tensor<int32, [4]> var_162_pad_0 = const()[name = tensor<string, []>("op_162_pad_0"), val = tensor<int32, [4]>([0, 0, 1, 1])];`
26	`tensor<int32, [2]> var_162_strides_0 = const()[name = tensor<string, []>("op_162_strides_0"), val = tensor<int32, [2]>([2, 2])];`
27	`tensor<int32, [2]> var_162_dilations_0 = const()[name = tensor<string, []>("op_162_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
28	`tensor<int32, []> var_162_groups_0 = const()[name = tensor<string, []>("op_162_groups_0"), val = tensor<int32, []>(1)];`
29	`tensor<fp16, [768, 768, 1, 3]> var_131_to_fp16 = const()[name = tensor<string, []>("op_131_to_fp16"), val = tensor<fp16, [768, 768, 1, 3]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(464320)))];`
30	`tensor<fp16, [1, 768, 1, 1500]> var_162_cast_fp16 = conv(bias = var_57_to_fp16, dilations = var_162_dilations_0, groups = var_162_groups_0, pad = var_162_pad_0, pad_type = var_162_pad_type_0, strides = var_162_strides_0, weight = var_131_to_fp16, x = hidden_states_1_cast_fp16)[name = tensor<string, []>("op_162_cast_fp16")];`
31	`tensor<string, []> var_200_pad_type_0 = const()[name = tensor<string, []>("op_200_pad_type_0"), val = tensor<string, []>("custom")];`
32	`tensor<int32, [4]> var_200_pad_0 = const()[name = tensor<string, []>("op_200_pad_0"), val = tensor<int32, [4]>([0, 0, 1, 1])];`
33	`tensor<int32, [2]> var_200_strides_0 = const()[name = tensor<string, []>("op_200_strides_0"), val = tensor<int32, [2]>([2, 2])];`
34	`tensor<int32, [2]> var_200_dilations_0 = const()[name = tensor<string, []>("op_200_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
35	`tensor<int32, []> var_200_groups_0 = const()[name = tensor<string, []>("op_200_groups_0"), val = tensor<int32, []>(1)];`
36	`tensor<fp16, [768, 768, 1, 3]> op_175_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [884736]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(4003328))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(4888128))), name = tensor<string, []>("op_175_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 3])];`
37	`tensor<fp16, [768]> var_181_to_fp16 = const()[name = tensor<string, []>("op_181_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(4888256)))];`
38	`tensor<fp16, [1, 768, 1, 1500]> var_200_cast_fp16 = conv(bias = var_181_to_fp16, dilations = var_200_dilations_0, groups = var_200_groups_0, pad = var_200_pad_0, pad_type = var_200_pad_type_0, strides = var_200_strides_0, weight = op_175_to_fp16_palettized, x = hidden_states_1_cast_fp16)[name = tensor<string, []>("op_200_cast_fp16")];`
39	`tensor<fp16, [1, 768, 1, 1500]> var_202_cast_fp16 = add(x = var_162_cast_fp16, y = var_200_cast_fp16)[name = tensor<string, []>("op_202_cast_fp16")];`
40	`tensor<string, []> hidden_states_3_mode_0 = const()[name = tensor<string, []>("hidden_states_3_mode_0"), val = tensor<string, []>("EXACT")];`
41	`tensor<fp16, [1, 768, 1, 1500]> hidden_states_3_cast_fp16 = gelu(mode = hidden_states_3_mode_0, x = var_202_cast_fp16)[name = tensor<string, []>("hidden_states_3_cast_fp16")];`
42	`tensor<fp16, [1, 768, 1, 1500]> var_222_to_fp16 = const()[name = tensor<string, []>("op_222_to_fp16"), val = tensor<fp16, [1, 768, 1, 1500]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(4889856)))];`
43	`tensor<fp16, [1, 768, 1, 1500]> inputs_1_cast_fp16 = add(x = hidden_states_3_cast_fp16, y = var_222_to_fp16)[name = tensor<string, []>("inputs_1_cast_fp16")];`
44	`tensor<int32, []> var_232 = const()[name = tensor<string, []>("op_232"), val = tensor<int32, []>(3)];`
45	`tensor<int32, [1]> out_1_axes_0 = const()[name = tensor<string, []>("out_1_axes_0"), val = tensor<int32, [1]>([1])];`
46	`tensor<fp16, []> var_254_to_fp16 = const()[name = tensor<string, []>("op_254_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
47	`tensor<fp16, [1, 768, 1, 1500]> out_1_cast_fp16 = layer_norm(axes = out_1_axes_0, epsilon = var_254_to_fp16, x = inputs_1_cast_fp16)[name = tensor<string, []>("out_1_cast_fp16")];`
48	`tensor<fp16, [768]> obj_1_variance_0_to_fp16 = const()[name = tensor<string, []>("obj_1_variance_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(7193920)))];`
49	`tensor<fp16, [768]> obj_1_gamma_0_to_fp16 = const()[name = tensor<string, []>("obj_1_gamma_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(7195520)))];`
50	`tensor<fp16, [768]> obj_1_beta_0_to_fp16 = const()[name = tensor<string, []>("obj_1_beta_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(7197120)))];`
51	`tensor<fp16, []> obj_1_epsilon_0_to_fp16 = const()[name = tensor<string, []>("obj_1_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
52	`tensor<fp16, [1, 768, 1, 1500]> obj_1_cast_fp16 = batch_norm(beta = obj_1_beta_0_to_fp16, epsilon = obj_1_epsilon_0_to_fp16, gamma = obj_1_gamma_0_to_fp16, mean = var_57_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_1_cast_fp16)[name = tensor<string, []>("obj_1_cast_fp16")];`
53	`tensor<string, []> var_276_pad_type_0 = const()[name = tensor<string, []>("op_276_pad_type_0"), val = tensor<string, []>("valid")];`
54	`tensor<int32, [2]> var_276_strides_0 = const()[name = tensor<string, []>("op_276_strides_0"), val = tensor<int32, [2]>([1, 1])];`
55	`tensor<int32, [4]> var_276_pad_0 = const()[name = tensor<string, []>("op_276_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
56	`tensor<int32, [2]> var_276_dilations_0 = const()[name = tensor<string, []>("op_276_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
57	`tensor<int32, []> var_276_groups_0 = const()[name = tensor<string, []>("op_276_groups_0"), val = tensor<int32, []>(1)];`
58	tensor<fp16, [768, 768, 1, 1]> layers_0_self_attn_q_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(7198720))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(7493696))), name = tensor<string, []>("layers_0_self_attn_q_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
59	`tensor<fp16, [768]> layers_0_self_attn_q_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_0_self_attn_q_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(7493824)))];`
60	`tensor<fp16, [1, 768, 1, 1500]> var_276_cast_fp16 = conv(bias = layers_0_self_attn_q_proj_inlier_module_bias_to_fp16, dilations = var_276_dilations_0, groups = var_276_groups_0, pad = var_276_pad_0, pad_type = var_276_pad_type_0, strides = var_276_strides_0, weight = layers_0_self_attn_q_proj_inlier_module_weight_to_fp16_palettized, x = obj_1_cast_fp16)[name = tensor<string, []>("op_276_cast_fp16")];`
61	`tensor<string, []> var_282_pad_type_0 = const()[name = tensor<string, []>("op_282_pad_type_0"), val = tensor<string, []>("valid")];`
62	`tensor<int32, [2]> var_282_strides_0 = const()[name = tensor<string, []>("op_282_strides_0"), val = tensor<int32, [2]>([1, 1])];`
63	`tensor<int32, [4]> var_282_pad_0 = const()[name = tensor<string, []>("op_282_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
64	`tensor<int32, [2]> var_282_dilations_0 = const()[name = tensor<string, []>("op_282_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
65	`tensor<int32, []> var_282_groups_0 = const()[name = tensor<string, []>("op_282_groups_0"), val = tensor<int32, []>(1)];`
66	tensor<fp16, [768, 768, 1, 1]> layers_0_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(7518208))), name = tensor<string, []>("layers_0_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [11338]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(7495424))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
67	`tensor<fp16, [1, 768, 1, 1500]> var_282_cast_fp16 = conv(dilations = var_282_dilations_0, groups = var_282_groups_0, pad = var_282_pad_0, pad_type = var_282_pad_type_0, strides = var_282_strides_0, weight = layers_0_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified, x = obj_1_cast_fp16)[name = tensor<string, []>("op_282_cast_fp16")];`
68	`tensor<fp16, [1, 768, 1, 1500]> query_1_cast_fp16 = add(x = var_276_cast_fp16, y = var_282_cast_fp16)[name = tensor<string, []>("query_1_cast_fp16")];`
69	`tensor<string, []> var_291_pad_type_0 = const()[name = tensor<string, []>("op_291_pad_type_0"), val = tensor<string, []>("valid")];`
70	`tensor<int32, [2]> var_291_strides_0 = const()[name = tensor<string, []>("op_291_strides_0"), val = tensor<int32, [2]>([1, 1])];`
71	`tensor<int32, [4]> var_291_pad_0 = const()[name = tensor<string, []>("op_291_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
72	`tensor<int32, [2]> var_291_dilations_0 = const()[name = tensor<string, []>("op_291_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
73	`tensor<int32, []> var_291_groups_0 = const()[name = tensor<string, []>("op_291_groups_0"), val = tensor<int32, []>(1)];`
74	tensor<fp16, [768, 768, 1, 1]> layers_0_self_attn_k_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(7592000))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(7886976))), name = tensor<string, []>("layers_0_self_attn_k_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
75	`tensor<fp16, [1, 768, 1, 1500]> var_291_cast_fp16 = conv(dilations = var_291_dilations_0, groups = var_291_groups_0, pad = var_291_pad_0, pad_type = var_291_pad_type_0, strides = var_291_strides_0, weight = layers_0_self_attn_k_proj_inlier_module_weight_to_fp16_palettized, x = obj_1_cast_fp16)[name = tensor<string, []>("op_291_cast_fp16")];`
76	`tensor<string, []> var_297_pad_type_0 = const()[name = tensor<string, []>("op_297_pad_type_0"), val = tensor<string, []>("valid")];`
77	`tensor<int32, [2]> var_297_strides_0 = const()[name = tensor<string, []>("op_297_strides_0"), val = tensor<int32, [2]>([1, 1])];`
78	`tensor<int32, [4]> var_297_pad_0 = const()[name = tensor<string, []>("op_297_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
79	`tensor<int32, [2]> var_297_dilations_0 = const()[name = tensor<string, []>("op_297_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
80	`tensor<int32, []> var_297_groups_0 = const()[name = tensor<string, []>("op_297_groups_0"), val = tensor<int32, []>(1)];`
81	tensor<fp16, [768, 768, 1, 1]> layers_0_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(7908352))), name = tensor<string, []>("layers_0_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [10583]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(7887104))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
82	`tensor<fp16, [1, 768, 1, 1500]> var_297_cast_fp16 = conv(dilations = var_297_dilations_0, groups = var_297_groups_0, pad = var_297_pad_0, pad_type = var_297_pad_type_0, strides = var_297_strides_0, weight = layers_0_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified, x = obj_1_cast_fp16)[name = tensor<string, []>("op_297_cast_fp16")];`
83	`tensor<fp16, [1, 768, 1, 1500]> key_1_cast_fp16 = add(x = var_291_cast_fp16, y = var_297_cast_fp16)[name = tensor<string, []>("key_1_cast_fp16")];`
84	`tensor<string, []> var_307_pad_type_0 = const()[name = tensor<string, []>("op_307_pad_type_0"), val = tensor<string, []>("valid")];`
85	`tensor<int32, [2]> var_307_strides_0 = const()[name = tensor<string, []>("op_307_strides_0"), val = tensor<int32, [2]>([1, 1])];`
86	`tensor<int32, [4]> var_307_pad_0 = const()[name = tensor<string, []>("op_307_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
87	`tensor<int32, [2]> var_307_dilations_0 = const()[name = tensor<string, []>("op_307_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
88	`tensor<int32, []> var_307_groups_0 = const()[name = tensor<string, []>("op_307_groups_0"), val = tensor<int32, []>(1)];`
89	tensor<fp16, [768, 768, 1, 1]> layers_0_self_attn_v_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(7982144))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(8277120))), name = tensor<string, []>("layers_0_self_attn_v_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
90	`tensor<fp16, [768]> layers_0_self_attn_v_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_0_self_attn_v_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(8277248)))];`
91	`tensor<fp16, [1, 768, 1, 1500]> var_307_cast_fp16 = conv(bias = layers_0_self_attn_v_proj_inlier_module_bias_to_fp16, dilations = var_307_dilations_0, groups = var_307_groups_0, pad = var_307_pad_0, pad_type = var_307_pad_type_0, strides = var_307_strides_0, weight = layers_0_self_attn_v_proj_inlier_module_weight_to_fp16_palettized, x = obj_1_cast_fp16)[name = tensor<string, []>("op_307_cast_fp16")];`
92	`tensor<string, []> var_313_pad_type_0 = const()[name = tensor<string, []>("op_313_pad_type_0"), val = tensor<string, []>("valid")];`
93	`tensor<int32, [2]> var_313_strides_0 = const()[name = tensor<string, []>("op_313_strides_0"), val = tensor<int32, [2]>([1, 1])];`
94	`tensor<int32, [4]> var_313_pad_0 = const()[name = tensor<string, []>("op_313_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
95	`tensor<int32, [2]> var_313_dilations_0 = const()[name = tensor<string, []>("op_313_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
96	`tensor<int32, []> var_313_groups_0 = const()[name = tensor<string, []>("op_313_groups_0"), val = tensor<int32, []>(1)];`
97	tensor<fp16, [768, 768, 1, 1]> layers_0_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(8302400))), name = tensor<string, []>("layers_0_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [11740]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(8278848))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
98	`tensor<fp16, [1, 768, 1, 1500]> var_313_cast_fp16 = conv(dilations = var_313_dilations_0, groups = var_313_groups_0, pad = var_313_pad_0, pad_type = var_313_pad_type_0, strides = var_313_strides_0, weight = layers_0_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified, x = obj_1_cast_fp16)[name = tensor<string, []>("op_313_cast_fp16")];`
99	`tensor<fp16, [1, 768, 1, 1500]> value_1_cast_fp16 = add(x = var_307_cast_fp16, y = var_313_cast_fp16)[name = tensor<string, []>("value_1_cast_fp16")];`
100	`tensor<int32, [4]> var_317 = const()[name = tensor<string, []>("op_317"), val = tensor<int32, [4]>([1, 12, 64, 1500])];`
101	`tensor<fp16, [1, 12, 64, 1500]> mh_q_1_cast_fp16 = reshape(shape = var_317, x = query_1_cast_fp16)[name = tensor<string, []>("mh_q_1_cast_fp16")];`
102	`tensor<fp16, []> var_319_to_fp16 = const()[name = tensor<string, []>("op_319_to_fp16"), val = tensor<fp16, []>(0x1p-3)];`
103	`tensor<fp16, [1, 12, 64, 1500]> var_320_cast_fp16 = mul(x = mh_q_1_cast_fp16, y = var_319_to_fp16)[name = tensor<string, []>("op_320_cast_fp16")];`
104	`tensor<int32, [4]> var_323 = const()[name = tensor<string, []>("op_323"), val = tensor<int32, [4]>([1, 12, 64, 1500])];`
105	`tensor<fp16, [1, 12, 64, 1500]> var_324_cast_fp16 = reshape(shape = var_323, x = key_1_cast_fp16)[name = tensor<string, []>("op_324_cast_fp16")];`
106	`tensor<bool, []> mh_w_1_transpose_x_0 = const()[name = tensor<string, []>("mh_w_1_transpose_x_0"), val = tensor<bool, []>(true)];`
107	`tensor<bool, []> mh_w_1_transpose_y_0 = const()[name = tensor<string, []>("mh_w_1_transpose_y_0"), val = tensor<bool, []>(false)];`
108	`tensor<fp16, [1, 12, 1500, 1500]> mh_w_1_cast_fp16 = matmul(transpose_x = mh_w_1_transpose_x_0, transpose_y = mh_w_1_transpose_y_0, x = var_320_cast_fp16, y = var_324_cast_fp16)[name = tensor<string, []>("mh_w_1_cast_fp16")];`
109	`tensor<fp16, [1, 12, 1500, 1500]> var_327_cast_fp16 = softmax(axis = var_232, x = mh_w_1_cast_fp16)[name = tensor<string, []>("op_327_cast_fp16")];`
110	`tensor<int32, [4]> var_328 = const()[name = tensor<string, []>("op_328"), val = tensor<int32, [4]>([1, 12, 64, 1500])];`
111	`tensor<fp16, [1, 12, 64, 1500]> var_329_cast_fp16 = reshape(shape = var_328, x = value_1_cast_fp16)[name = tensor<string, []>("op_329_cast_fp16")];`
112	`tensor<bool, []> attn_1_transpose_x_0 = const()[name = tensor<string, []>("attn_1_transpose_x_0"), val = tensor<bool, []>(false)];`
113	`tensor<bool, []> attn_1_transpose_y_0 = const()[name = tensor<string, []>("attn_1_transpose_y_0"), val = tensor<bool, []>(true)];`
114	`tensor<fp16, [1, 12, 64, 1500]> attn_1_cast_fp16 = matmul(transpose_x = attn_1_transpose_x_0, transpose_y = attn_1_transpose_y_0, x = var_329_cast_fp16, y = var_327_cast_fp16)[name = tensor<string, []>("attn_1_cast_fp16")];`
115	`tensor<int32, [4]> var_332 = const()[name = tensor<string, []>("op_332"), val = tensor<int32, [4]>([1, 768, 1, 1500])];`
116	`tensor<fp16, [1, 768, 1, 1500]> input_1_cast_fp16 = reshape(shape = var_332, x = attn_1_cast_fp16)[name = tensor<string, []>("input_1_cast_fp16")];`
117	`tensor<string, []> var_342_pad_type_0 = const()[name = tensor<string, []>("op_342_pad_type_0"), val = tensor<string, []>("valid")];`
118	`tensor<int32, [2]> var_342_strides_0 = const()[name = tensor<string, []>("op_342_strides_0"), val = tensor<int32, [2]>([1, 1])];`
119	`tensor<int32, [4]> var_342_pad_0 = const()[name = tensor<string, []>("op_342_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
120	`tensor<int32, [2]> var_342_dilations_0 = const()[name = tensor<string, []>("op_342_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
121	`tensor<int32, []> var_342_groups_0 = const()[name = tensor<string, []>("op_342_groups_0"), val = tensor<int32, []>(1)];`
122	tensor<fp16, [768, 768, 1, 1]> layers_0_self_attn_o_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(8376192))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(8671168))), name = tensor<string, []>("layers_0_self_attn_o_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
123	`tensor<fp16, [768]> layers_0_self_attn_o_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_0_self_attn_o_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(8671296)))];`
124	`tensor<fp16, [1, 768, 1, 1500]> var_342_cast_fp16 = conv(bias = layers_0_self_attn_o_proj_inlier_module_bias_to_fp16, dilations = var_342_dilations_0, groups = var_342_groups_0, pad = var_342_pad_0, pad_type = var_342_pad_type_0, strides = var_342_strides_0, weight = layers_0_self_attn_o_proj_inlier_module_weight_to_fp16_palettized, x = input_1_cast_fp16)[name = tensor<string, []>("op_342_cast_fp16")];`
125	`tensor<string, []> var_348_pad_type_0 = const()[name = tensor<string, []>("op_348_pad_type_0"), val = tensor<string, []>("valid")];`
126	`tensor<int32, [2]> var_348_strides_0 = const()[name = tensor<string, []>("op_348_strides_0"), val = tensor<int32, [2]>([1, 1])];`
127	`tensor<int32, [4]> var_348_pad_0 = const()[name = tensor<string, []>("op_348_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
128	`tensor<int32, [2]> var_348_dilations_0 = const()[name = tensor<string, []>("op_348_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
129	`tensor<int32, []> var_348_groups_0 = const()[name = tensor<string, []>("op_348_groups_0"), val = tensor<int32, []>(1)];`
130	tensor<fp16, [768, 768, 1, 1]> layers_0_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(8692480))), name = tensor<string, []>("layers_0_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [9758]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(8672896))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
131	`tensor<fp16, [1, 768, 1, 1500]> var_348_cast_fp16 = conv(dilations = var_348_dilations_0, groups = var_348_groups_0, pad = var_348_pad_0, pad_type = var_348_pad_type_0, strides = var_348_strides_0, weight = layers_0_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified, x = input_1_cast_fp16)[name = tensor<string, []>("op_348_cast_fp16")];`
132	`tensor<fp16, [1, 768, 1, 1500]> obj_3_cast_fp16 = add(x = var_342_cast_fp16, y = var_348_cast_fp16)[name = tensor<string, []>("obj_3_cast_fp16")];`
133	`tensor<fp16, [1, 768, 1, 1500]> inputs_3_cast_fp16 = add(x = inputs_1_cast_fp16, y = obj_3_cast_fp16)[name = tensor<string, []>("inputs_3_cast_fp16")];`
134	`tensor<int32, [1]> out_3_axes_0 = const()[name = tensor<string, []>("out_3_axes_0"), val = tensor<int32, [1]>([1])];`
135	`tensor<fp16, []> var_359_to_fp16 = const()[name = tensor<string, []>("op_359_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
136	`tensor<fp16, [1, 768, 1, 1500]> out_3_cast_fp16 = layer_norm(axes = out_3_axes_0, epsilon = var_359_to_fp16, x = inputs_3_cast_fp16)[name = tensor<string, []>("out_3_cast_fp16")];`
137	`tensor<fp16, [768]> input_3_gamma_0_to_fp16 = const()[name = tensor<string, []>("input_3_gamma_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(8766272)))];`
138	`tensor<fp16, [768]> input_3_beta_0_to_fp16 = const()[name = tensor<string, []>("input_3_beta_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(8767872)))];`
139	`tensor<fp16, []> input_3_epsilon_0_to_fp16 = const()[name = tensor<string, []>("input_3_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
140	`tensor<fp16, [1, 768, 1, 1500]> input_3_cast_fp16 = batch_norm(beta = input_3_beta_0_to_fp16, epsilon = input_3_epsilon_0_to_fp16, gamma = input_3_gamma_0_to_fp16, mean = var_57_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_3_cast_fp16)[name = tensor<string, []>("input_3_cast_fp16")];`
141	`tensor<string, []> var_377_pad_type_0 = const()[name = tensor<string, []>("op_377_pad_type_0"), val = tensor<string, []>("valid")];`
142	`tensor<int32, [2]> var_377_strides_0 = const()[name = tensor<string, []>("op_377_strides_0"), val = tensor<int32, [2]>([1, 1])];`
143	`tensor<int32, [4]> var_377_pad_0 = const()[name = tensor<string, []>("op_377_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
144	`tensor<int32, [2]> var_377_dilations_0 = const()[name = tensor<string, []>("op_377_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
145	`tensor<int32, []> var_377_groups_0 = const()[name = tensor<string, []>("op_377_groups_0"), val = tensor<int32, []>(1)];`
146	tensor<fp16, [3072, 768, 1, 1]> layers_0_fc1_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [1179648]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(8769472))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(9949184))), name = tensor<string, []>("layers_0_fc1_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([3072, 768, 1, 1])];
147	`tensor<fp16, [3072]> layers_0_fc1_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_0_fc1_inlier_module_bias_to_fp16"), val = tensor<fp16, [3072]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(9949312)))];`
148	`tensor<fp16, [1, 3072, 1, 1500]> var_377_cast_fp16 = conv(bias = layers_0_fc1_inlier_module_bias_to_fp16, dilations = var_377_dilations_0, groups = var_377_groups_0, pad = var_377_pad_0, pad_type = var_377_pad_type_0, strides = var_377_strides_0, weight = layers_0_fc1_inlier_module_weight_to_fp16_palettized, x = input_3_cast_fp16)[name = tensor<string, []>("op_377_cast_fp16")];`
149	`tensor<string, []> var_383_pad_type_0 = const()[name = tensor<string, []>("op_383_pad_type_0"), val = tensor<string, []>("valid")];`
150	`tensor<int32, [2]> var_383_strides_0 = const()[name = tensor<string, []>("op_383_strides_0"), val = tensor<int32, [2]>([1, 1])];`
151	`tensor<int32, [4]> var_383_pad_0 = const()[name = tensor<string, []>("op_383_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
152	`tensor<int32, [2]> var_383_dilations_0 = const()[name = tensor<string, []>("op_383_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
153	`tensor<int32, []> var_383_groups_0 = const()[name = tensor<string, []>("op_383_groups_0"), val = tensor<int32, []>(1)];`
154	tensor<fp16, [3072, 768, 1, 1]> layers_0_fc1_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(10044736))), name = tensor<string, []>("layers_0_fc1_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [44545]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(9955520))), shape = tensor<uint32, [4]>([3072, 768, 1, 1])];
155	`tensor<fp16, [1, 3072, 1, 1500]> var_383_cast_fp16 = conv(dilations = var_383_dilations_0, groups = var_383_groups_0, pad = var_383_pad_0, pad_type = var_383_pad_type_0, strides = var_383_strides_0, weight = layers_0_fc1_outlier_module_weight_to_fp16_sparsified, x = input_3_cast_fp16)[name = tensor<string, []>("op_383_cast_fp16")];`
156	`tensor<fp16, [1, 3072, 1, 1500]> input_5_cast_fp16 = add(x = var_377_cast_fp16, y = var_383_cast_fp16)[name = tensor<string, []>("input_5_cast_fp16")];`
157	`tensor<string, []> input_7_mode_0 = const()[name = tensor<string, []>("input_7_mode_0"), val = tensor<string, []>("EXACT")];`
158	`tensor<fp16, [1, 3072, 1, 1500]> input_7_cast_fp16 = gelu(mode = input_7_mode_0, x = input_5_cast_fp16)[name = tensor<string, []>("input_7_cast_fp16")];`
159	`tensor<string, []> var_394_pad_type_0 = const()[name = tensor<string, []>("op_394_pad_type_0"), val = tensor<string, []>("valid")];`
160	`tensor<int32, [2]> var_394_strides_0 = const()[name = tensor<string, []>("op_394_strides_0"), val = tensor<int32, [2]>([1, 1])];`
161	`tensor<int32, [4]> var_394_pad_0 = const()[name = tensor<string, []>("op_394_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
162	`tensor<int32, [2]> var_394_dilations_0 = const()[name = tensor<string, []>("op_394_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
163	`tensor<int32, []> var_394_groups_0 = const()[name = tensor<string, []>("op_394_groups_0"), val = tensor<int32, []>(1)];`
164	tensor<fp16, [768, 3072, 1, 1]> layers_0_fc2_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [1179648]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(10339712))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(11519424))), name = tensor<string, []>("layers_0_fc2_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 3072, 1, 1])];
165	`tensor<fp16, [768]> layers_0_fc2_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_0_fc2_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(11519552)))];`
166	`tensor<fp16, [1, 768, 1, 1500]> var_394_cast_fp16 = conv(bias = layers_0_fc2_inlier_module_bias_to_fp16, dilations = var_394_dilations_0, groups = var_394_groups_0, pad = var_394_pad_0, pad_type = var_394_pad_type_0, strides = var_394_strides_0, weight = layers_0_fc2_inlier_module_weight_to_fp16_palettized, x = input_7_cast_fp16)[name = tensor<string, []>("op_394_cast_fp16")];`
167	`tensor<string, []> var_400_pad_type_0 = const()[name = tensor<string, []>("op_400_pad_type_0"), val = tensor<string, []>("valid")];`
168	`tensor<int32, [2]> var_400_strides_0 = const()[name = tensor<string, []>("op_400_strides_0"), val = tensor<int32, [2]>([1, 1])];`
169	`tensor<int32, [4]> var_400_pad_0 = const()[name = tensor<string, []>("op_400_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
170	`tensor<int32, [2]> var_400_dilations_0 = const()[name = tensor<string, []>("op_400_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
171	`tensor<int32, []> var_400_groups_0 = const()[name = tensor<string, []>("op_400_groups_0"), val = tensor<int32, []>(1)];`
172	tensor<fp16, [768, 3072, 1, 1]> layers_0_fc2_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(11594560))), name = tensor<string, []>("layers_0_fc2_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [36651]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(11521152))), shape = tensor<uint32, [4]>([768, 3072, 1, 1])];
173	`tensor<fp16, [1, 768, 1, 1500]> var_400_cast_fp16 = conv(dilations = var_400_dilations_0, groups = var_400_groups_0, pad = var_400_pad_0, pad_type = var_400_pad_type_0, strides = var_400_strides_0, weight = layers_0_fc2_outlier_module_weight_to_fp16_sparsified, x = input_7_cast_fp16)[name = tensor<string, []>("op_400_cast_fp16")];`
174	`tensor<fp16, [1, 768, 1, 1500]> hidden_states_5_cast_fp16 = add(x = var_394_cast_fp16, y = var_400_cast_fp16)[name = tensor<string, []>("hidden_states_5_cast_fp16")];`
175	`tensor<fp16, [1, 768, 1, 1500]> inputs_5_cast_fp16 = add(x = inputs_3_cast_fp16, y = hidden_states_5_cast_fp16)[name = tensor<string, []>("inputs_5_cast_fp16")];`
176	`tensor<int32, []> var_406 = const()[name = tensor<string, []>("op_406"), val = tensor<int32, []>(3)];`
177	`tensor<int32, [1]> out_5_axes_0 = const()[name = tensor<string, []>("out_5_axes_0"), val = tensor<int32, [1]>([1])];`
178	`tensor<fp16, []> var_428_to_fp16 = const()[name = tensor<string, []>("op_428_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
179	`tensor<fp16, [1, 768, 1, 1500]> out_5_cast_fp16 = layer_norm(axes = out_5_axes_0, epsilon = var_428_to_fp16, x = inputs_5_cast_fp16)[name = tensor<string, []>("out_5_cast_fp16")];`
180	`tensor<fp16, [768]> obj_5_gamma_0_to_fp16 = const()[name = tensor<string, []>("obj_5_gamma_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(11889536)))];`
181	`tensor<fp16, [768]> obj_5_beta_0_to_fp16 = const()[name = tensor<string, []>("obj_5_beta_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(11891136)))];`
182	`tensor<fp16, []> obj_5_epsilon_0_to_fp16 = const()[name = tensor<string, []>("obj_5_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
183	`tensor<fp16, [1, 768, 1, 1500]> obj_5_cast_fp16 = batch_norm(beta = obj_5_beta_0_to_fp16, epsilon = obj_5_epsilon_0_to_fp16, gamma = obj_5_gamma_0_to_fp16, mean = var_57_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_5_cast_fp16)[name = tensor<string, []>("obj_5_cast_fp16")];`
184	`tensor<string, []> var_450_pad_type_0 = const()[name = tensor<string, []>("op_450_pad_type_0"), val = tensor<string, []>("valid")];`
185	`tensor<int32, [2]> var_450_strides_0 = const()[name = tensor<string, []>("op_450_strides_0"), val = tensor<int32, [2]>([1, 1])];`
186	`tensor<int32, [4]> var_450_pad_0 = const()[name = tensor<string, []>("op_450_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
187	`tensor<int32, [2]> var_450_dilations_0 = const()[name = tensor<string, []>("op_450_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
188	`tensor<int32, []> var_450_groups_0 = const()[name = tensor<string, []>("op_450_groups_0"), val = tensor<int32, []>(1)];`
189	tensor<fp16, [768, 768, 1, 1]> layers_1_self_attn_q_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(11892736))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(12187712))), name = tensor<string, []>("layers_1_self_attn_q_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
190	`tensor<fp16, [768]> layers_1_self_attn_q_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_1_self_attn_q_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(12187840)))];`
191	`tensor<fp16, [1, 768, 1, 1500]> var_450_cast_fp16 = conv(bias = layers_1_self_attn_q_proj_inlier_module_bias_to_fp16, dilations = var_450_dilations_0, groups = var_450_groups_0, pad = var_450_pad_0, pad_type = var_450_pad_type_0, strides = var_450_strides_0, weight = layers_1_self_attn_q_proj_inlier_module_weight_to_fp16_palettized, x = obj_5_cast_fp16)[name = tensor<string, []>("op_450_cast_fp16")];`
192	`tensor<string, []> var_456_pad_type_0 = const()[name = tensor<string, []>("op_456_pad_type_0"), val = tensor<string, []>("valid")];`
193	`tensor<int32, [2]> var_456_strides_0 = const()[name = tensor<string, []>("op_456_strides_0"), val = tensor<int32, [2]>([1, 1])];`
194	`tensor<int32, [4]> var_456_pad_0 = const()[name = tensor<string, []>("op_456_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
195	`tensor<int32, [2]> var_456_dilations_0 = const()[name = tensor<string, []>("op_456_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
196	`tensor<int32, []> var_456_groups_0 = const()[name = tensor<string, []>("op_456_groups_0"), val = tensor<int32, []>(1)];`
197	tensor<fp16, [768, 768, 1, 1]> layers_1_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(12206656))), name = tensor<string, []>("layers_1_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [8573]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(12189440))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
198	`tensor<fp16, [1, 768, 1, 1500]> var_456_cast_fp16 = conv(dilations = var_456_dilations_0, groups = var_456_groups_0, pad = var_456_pad_0, pad_type = var_456_pad_type_0, strides = var_456_strides_0, weight = layers_1_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified, x = obj_5_cast_fp16)[name = tensor<string, []>("op_456_cast_fp16")];`
199	`tensor<fp16, [1, 768, 1, 1500]> query_3_cast_fp16 = add(x = var_450_cast_fp16, y = var_456_cast_fp16)[name = tensor<string, []>("query_3_cast_fp16")];`
200	`tensor<string, []> var_465_pad_type_0 = const()[name = tensor<string, []>("op_465_pad_type_0"), val = tensor<string, []>("valid")];`
201	`tensor<int32, [2]> var_465_strides_0 = const()[name = tensor<string, []>("op_465_strides_0"), val = tensor<int32, [2]>([1, 1])];`
202	`tensor<int32, [4]> var_465_pad_0 = const()[name = tensor<string, []>("op_465_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
203	`tensor<int32, [2]> var_465_dilations_0 = const()[name = tensor<string, []>("op_465_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
204	`tensor<int32, []> var_465_groups_0 = const()[name = tensor<string, []>("op_465_groups_0"), val = tensor<int32, []>(1)];`
205	tensor<fp16, [768, 768, 1, 1]> layers_1_self_attn_k_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(12280448))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(12575424))), name = tensor<string, []>("layers_1_self_attn_k_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
206	`tensor<fp16, [1, 768, 1, 1500]> var_465_cast_fp16 = conv(dilations = var_465_dilations_0, groups = var_465_groups_0, pad = var_465_pad_0, pad_type = var_465_pad_type_0, strides = var_465_strides_0, weight = layers_1_self_attn_k_proj_inlier_module_weight_to_fp16_palettized, x = obj_5_cast_fp16)[name = tensor<string, []>("op_465_cast_fp16")];`
207	`tensor<string, []> var_471_pad_type_0 = const()[name = tensor<string, []>("op_471_pad_type_0"), val = tensor<string, []>("valid")];`
208	`tensor<int32, [2]> var_471_strides_0 = const()[name = tensor<string, []>("op_471_strides_0"), val = tensor<int32, [2]>([1, 1])];`
209	`tensor<int32, [4]> var_471_pad_0 = const()[name = tensor<string, []>("op_471_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
210	`tensor<int32, [2]> var_471_dilations_0 = const()[name = tensor<string, []>("op_471_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
211	`tensor<int32, []> var_471_groups_0 = const()[name = tensor<string, []>("op_471_groups_0"), val = tensor<int32, []>(1)];`
212	tensor<fp16, [768, 768, 1, 1]> layers_1_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(12591360))), name = tensor<string, []>("layers_1_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [7864]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(12575552))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
213	`tensor<fp16, [1, 768, 1, 1500]> var_471_cast_fp16 = conv(dilations = var_471_dilations_0, groups = var_471_groups_0, pad = var_471_pad_0, pad_type = var_471_pad_type_0, strides = var_471_strides_0, weight = layers_1_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified, x = obj_5_cast_fp16)[name = tensor<string, []>("op_471_cast_fp16")];`
214	`tensor<fp16, [1, 768, 1, 1500]> key_3_cast_fp16 = add(x = var_465_cast_fp16, y = var_471_cast_fp16)[name = tensor<string, []>("key_3_cast_fp16")];`
215	`tensor<string, []> var_481_pad_type_0 = const()[name = tensor<string, []>("op_481_pad_type_0"), val = tensor<string, []>("valid")];`
216	`tensor<int32, [2]> var_481_strides_0 = const()[name = tensor<string, []>("op_481_strides_0"), val = tensor<int32, [2]>([1, 1])];`
217	`tensor<int32, [4]> var_481_pad_0 = const()[name = tensor<string, []>("op_481_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
218	`tensor<int32, [2]> var_481_dilations_0 = const()[name = tensor<string, []>("op_481_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
219	`tensor<int32, []> var_481_groups_0 = const()[name = tensor<string, []>("op_481_groups_0"), val = tensor<int32, []>(1)];`
220	tensor<fp16, [768, 768, 1, 1]> layers_1_self_attn_v_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(12665152))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(12960128))), name = tensor<string, []>("layers_1_self_attn_v_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
221	`tensor<fp16, [768]> layers_1_self_attn_v_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_1_self_attn_v_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(12960256)))];`
222	`tensor<fp16, [1, 768, 1, 1500]> var_481_cast_fp16 = conv(bias = layers_1_self_attn_v_proj_inlier_module_bias_to_fp16, dilations = var_481_dilations_0, groups = var_481_groups_0, pad = var_481_pad_0, pad_type = var_481_pad_type_0, strides = var_481_strides_0, weight = layers_1_self_attn_v_proj_inlier_module_weight_to_fp16_palettized, x = obj_5_cast_fp16)[name = tensor<string, []>("op_481_cast_fp16")];`
223	`tensor<string, []> var_487_pad_type_0 = const()[name = tensor<string, []>("op_487_pad_type_0"), val = tensor<string, []>("valid")];`
224	`tensor<int32, [2]> var_487_strides_0 = const()[name = tensor<string, []>("op_487_strides_0"), val = tensor<int32, [2]>([1, 1])];`
225	`tensor<int32, [4]> var_487_pad_0 = const()[name = tensor<string, []>("op_487_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
226	`tensor<int32, [2]> var_487_dilations_0 = const()[name = tensor<string, []>("op_487_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
227	`tensor<int32, []> var_487_groups_0 = const()[name = tensor<string, []>("op_487_groups_0"), val = tensor<int32, []>(1)];`
228	tensor<fp16, [768, 768, 1, 1]> layers_1_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(12975872))), name = tensor<string, []>("layers_1_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [6964]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(12961856))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
229	`tensor<fp16, [1, 768, 1, 1500]> var_487_cast_fp16 = conv(dilations = var_487_dilations_0, groups = var_487_groups_0, pad = var_487_pad_0, pad_type = var_487_pad_type_0, strides = var_487_strides_0, weight = layers_1_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified, x = obj_5_cast_fp16)[name = tensor<string, []>("op_487_cast_fp16")];`
230	`tensor<fp16, [1, 768, 1, 1500]> value_3_cast_fp16 = add(x = var_481_cast_fp16, y = var_487_cast_fp16)[name = tensor<string, []>("value_3_cast_fp16")];`
231	`tensor<int32, [4]> var_491 = const()[name = tensor<string, []>("op_491"), val = tensor<int32, [4]>([1, 12, 64, 1500])];`
232	`tensor<fp16, [1, 12, 64, 1500]> mh_q_3_cast_fp16 = reshape(shape = var_491, x = query_3_cast_fp16)[name = tensor<string, []>("mh_q_3_cast_fp16")];`
233	`tensor<fp16, []> var_493_to_fp16 = const()[name = tensor<string, []>("op_493_to_fp16"), val = tensor<fp16, []>(0x1p-3)];`
234	`tensor<fp16, [1, 12, 64, 1500]> var_494_cast_fp16 = mul(x = mh_q_3_cast_fp16, y = var_493_to_fp16)[name = tensor<string, []>("op_494_cast_fp16")];`
235	`tensor<int32, [4]> var_497 = const()[name = tensor<string, []>("op_497"), val = tensor<int32, [4]>([1, 12, 64, 1500])];`
236	`tensor<fp16, [1, 12, 64, 1500]> var_498_cast_fp16 = reshape(shape = var_497, x = key_3_cast_fp16)[name = tensor<string, []>("op_498_cast_fp16")];`
237	`tensor<bool, []> mh_w_3_transpose_x_0 = const()[name = tensor<string, []>("mh_w_3_transpose_x_0"), val = tensor<bool, []>(true)];`
238	`tensor<bool, []> mh_w_3_transpose_y_0 = const()[name = tensor<string, []>("mh_w_3_transpose_y_0"), val = tensor<bool, []>(false)];`
239	`tensor<fp16, [1, 12, 1500, 1500]> mh_w_3_cast_fp16 = matmul(transpose_x = mh_w_3_transpose_x_0, transpose_y = mh_w_3_transpose_y_0, x = var_494_cast_fp16, y = var_498_cast_fp16)[name = tensor<string, []>("mh_w_3_cast_fp16")];`
240	`tensor<fp16, [1, 12, 1500, 1500]> var_501_cast_fp16 = softmax(axis = var_406, x = mh_w_3_cast_fp16)[name = tensor<string, []>("op_501_cast_fp16")];`
241	`tensor<int32, [4]> var_502 = const()[name = tensor<string, []>("op_502"), val = tensor<int32, [4]>([1, 12, 64, 1500])];`
242	`tensor<fp16, [1, 12, 64, 1500]> var_503_cast_fp16 = reshape(shape = var_502, x = value_3_cast_fp16)[name = tensor<string, []>("op_503_cast_fp16")];`
243	`tensor<bool, []> attn_3_transpose_x_0 = const()[name = tensor<string, []>("attn_3_transpose_x_0"), val = tensor<bool, []>(false)];`
244	`tensor<bool, []> attn_3_transpose_y_0 = const()[name = tensor<string, []>("attn_3_transpose_y_0"), val = tensor<bool, []>(true)];`
245	`tensor<fp16, [1, 12, 64, 1500]> attn_3_cast_fp16 = matmul(transpose_x = attn_3_transpose_x_0, transpose_y = attn_3_transpose_y_0, x = var_503_cast_fp16, y = var_501_cast_fp16)[name = tensor<string, []>("attn_3_cast_fp16")];`
246	`tensor<int32, [4]> var_506 = const()[name = tensor<string, []>("op_506"), val = tensor<int32, [4]>([1, 768, 1, 1500])];`
247	`tensor<fp16, [1, 768, 1, 1500]> input_9_cast_fp16 = reshape(shape = var_506, x = attn_3_cast_fp16)[name = tensor<string, []>("input_9_cast_fp16")];`
248	`tensor<string, []> var_516_pad_type_0 = const()[name = tensor<string, []>("op_516_pad_type_0"), val = tensor<string, []>("valid")];`
249	`tensor<int32, [2]> var_516_strides_0 = const()[name = tensor<string, []>("op_516_strides_0"), val = tensor<int32, [2]>([1, 1])];`
250	`tensor<int32, [4]> var_516_pad_0 = const()[name = tensor<string, []>("op_516_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
251	`tensor<int32, [2]> var_516_dilations_0 = const()[name = tensor<string, []>("op_516_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
252	`tensor<int32, []> var_516_groups_0 = const()[name = tensor<string, []>("op_516_groups_0"), val = tensor<int32, []>(1)];`
253	tensor<fp16, [768, 768, 1, 1]> layers_1_self_attn_o_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(13049664))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(13344640))), name = tensor<string, []>("layers_1_self_attn_o_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
254	`tensor<fp16, [768]> layers_1_self_attn_o_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_1_self_attn_o_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(13344768)))];`
255	`tensor<fp16, [1, 768, 1, 1500]> var_516_cast_fp16 = conv(bias = layers_1_self_attn_o_proj_inlier_module_bias_to_fp16, dilations = var_516_dilations_0, groups = var_516_groups_0, pad = var_516_pad_0, pad_type = var_516_pad_type_0, strides = var_516_strides_0, weight = layers_1_self_attn_o_proj_inlier_module_weight_to_fp16_palettized, x = input_9_cast_fp16)[name = tensor<string, []>("op_516_cast_fp16")];`
256	`tensor<string, []> var_522_pad_type_0 = const()[name = tensor<string, []>("op_522_pad_type_0"), val = tensor<string, []>("valid")];`
257	`tensor<int32, [2]> var_522_strides_0 = const()[name = tensor<string, []>("op_522_strides_0"), val = tensor<int32, [2]>([1, 1])];`
258	`tensor<int32, [4]> var_522_pad_0 = const()[name = tensor<string, []>("op_522_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
259	`tensor<int32, [2]> var_522_dilations_0 = const()[name = tensor<string, []>("op_522_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
260	`tensor<int32, []> var_522_groups_0 = const()[name = tensor<string, []>("op_522_groups_0"), val = tensor<int32, []>(1)];`
261	tensor<fp16, [768, 768, 1, 1]> layers_1_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(13357056))), name = tensor<string, []>("layers_1_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [5299]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(13346368))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
262	`tensor<fp16, [1, 768, 1, 1500]> var_522_cast_fp16 = conv(dilations = var_522_dilations_0, groups = var_522_groups_0, pad = var_522_pad_0, pad_type = var_522_pad_type_0, strides = var_522_strides_0, weight = layers_1_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified, x = input_9_cast_fp16)[name = tensor<string, []>("op_522_cast_fp16")];`
263	`tensor<fp16, [1, 768, 1, 1500]> obj_7_cast_fp16 = add(x = var_516_cast_fp16, y = var_522_cast_fp16)[name = tensor<string, []>("obj_7_cast_fp16")];`
264	`tensor<fp16, [1, 768, 1, 1500]> inputs_7_cast_fp16 = add(x = inputs_5_cast_fp16, y = obj_7_cast_fp16)[name = tensor<string, []>("inputs_7_cast_fp16")];`
265	`tensor<int32, [1]> out_7_axes_0 = const()[name = tensor<string, []>("out_7_axes_0"), val = tensor<int32, [1]>([1])];`
266	`tensor<fp16, []> var_533_to_fp16 = const()[name = tensor<string, []>("op_533_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
267	`tensor<fp16, [1, 768, 1, 1500]> out_7_cast_fp16 = layer_norm(axes = out_7_axes_0, epsilon = var_533_to_fp16, x = inputs_7_cast_fp16)[name = tensor<string, []>("out_7_cast_fp16")];`
268	`tensor<fp16, [768]> input_11_gamma_0_to_fp16 = const()[name = tensor<string, []>("input_11_gamma_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(13430848)))];`
269	`tensor<fp16, [768]> input_11_beta_0_to_fp16 = const()[name = tensor<string, []>("input_11_beta_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(13432448)))];`
270	`tensor<fp16, []> input_11_epsilon_0_to_fp16 = const()[name = tensor<string, []>("input_11_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
271	`tensor<fp16, [1, 768, 1, 1500]> input_11_cast_fp16 = batch_norm(beta = input_11_beta_0_to_fp16, epsilon = input_11_epsilon_0_to_fp16, gamma = input_11_gamma_0_to_fp16, mean = var_57_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_7_cast_fp16)[name = tensor<string, []>("input_11_cast_fp16")];`
272	`tensor<string, []> var_551_pad_type_0 = const()[name = tensor<string, []>("op_551_pad_type_0"), val = tensor<string, []>("valid")];`
273	`tensor<int32, [2]> var_551_strides_0 = const()[name = tensor<string, []>("op_551_strides_0"), val = tensor<int32, [2]>([1, 1])];`
274	`tensor<int32, [4]> var_551_pad_0 = const()[name = tensor<string, []>("op_551_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
275	`tensor<int32, [2]> var_551_dilations_0 = const()[name = tensor<string, []>("op_551_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
276	`tensor<int32, []> var_551_groups_0 = const()[name = tensor<string, []>("op_551_groups_0"), val = tensor<int32, []>(1)];`
277	tensor<fp16, [3072, 768, 1, 1]> layers_1_fc1_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [1179648]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(13434048))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(14613760))), name = tensor<string, []>("layers_1_fc1_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([3072, 768, 1, 1])];
278	`tensor<fp16, [3072]> layers_1_fc1_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_1_fc1_inlier_module_bias_to_fp16"), val = tensor<fp16, [3072]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(14613888)))];`
279	`tensor<fp16, [1, 3072, 1, 1500]> var_551_cast_fp16 = conv(bias = layers_1_fc1_inlier_module_bias_to_fp16, dilations = var_551_dilations_0, groups = var_551_groups_0, pad = var_551_pad_0, pad_type = var_551_pad_type_0, strides = var_551_strides_0, weight = layers_1_fc1_inlier_module_weight_to_fp16_palettized, x = input_11_cast_fp16)[name = tensor<string, []>("op_551_cast_fp16")];`
280	`tensor<string, []> var_557_pad_type_0 = const()[name = tensor<string, []>("op_557_pad_type_0"), val = tensor<string, []>("valid")];`
281	`tensor<int32, [2]> var_557_strides_0 = const()[name = tensor<string, []>("op_557_strides_0"), val = tensor<int32, [2]>([1, 1])];`
282	`tensor<int32, [4]> var_557_pad_0 = const()[name = tensor<string, []>("op_557_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
283	`tensor<int32, [2]> var_557_dilations_0 = const()[name = tensor<string, []>("op_557_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
284	`tensor<int32, []> var_557_groups_0 = const()[name = tensor<string, []>("op_557_groups_0"), val = tensor<int32, []>(1)];`
285	tensor<fp16, [3072, 768, 1, 1]> layers_1_fc1_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(14688448))), name = tensor<string, []>("layers_1_fc1_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [34117]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(14620096))), shape = tensor<uint32, [4]>([3072, 768, 1, 1])];
286	`tensor<fp16, [1, 3072, 1, 1500]> var_557_cast_fp16 = conv(dilations = var_557_dilations_0, groups = var_557_groups_0, pad = var_557_pad_0, pad_type = var_557_pad_type_0, strides = var_557_strides_0, weight = layers_1_fc1_outlier_module_weight_to_fp16_sparsified, x = input_11_cast_fp16)[name = tensor<string, []>("op_557_cast_fp16")];`
287	`tensor<fp16, [1, 3072, 1, 1500]> input_13_cast_fp16 = add(x = var_551_cast_fp16, y = var_557_cast_fp16)[name = tensor<string, []>("input_13_cast_fp16")];`
288	`tensor<string, []> input_15_mode_0 = const()[name = tensor<string, []>("input_15_mode_0"), val = tensor<string, []>("EXACT")];`
289	`tensor<fp16, [1, 3072, 1, 1500]> input_15_cast_fp16 = gelu(mode = input_15_mode_0, x = input_13_cast_fp16)[name = tensor<string, []>("input_15_cast_fp16")];`
290	`tensor<string, []> var_568_pad_type_0 = const()[name = tensor<string, []>("op_568_pad_type_0"), val = tensor<string, []>("valid")];`
291	`tensor<int32, [2]> var_568_strides_0 = const()[name = tensor<string, []>("op_568_strides_0"), val = tensor<int32, [2]>([1, 1])];`
292	`tensor<int32, [4]> var_568_pad_0 = const()[name = tensor<string, []>("op_568_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
293	`tensor<int32, [2]> var_568_dilations_0 = const()[name = tensor<string, []>("op_568_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
294	`tensor<int32, []> var_568_groups_0 = const()[name = tensor<string, []>("op_568_groups_0"), val = tensor<int32, []>(1)];`
295	tensor<fp16, [768, 3072, 1, 1]> layers_1_fc2_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [1179648]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(14983424))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(16163136))), name = tensor<string, []>("layers_1_fc2_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 3072, 1, 1])];
296	`tensor<fp16, [768]> layers_1_fc2_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_1_fc2_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(16163264)))];`
297	`tensor<fp16, [1, 768, 1, 1500]> var_568_cast_fp16 = conv(bias = layers_1_fc2_inlier_module_bias_to_fp16, dilations = var_568_dilations_0, groups = var_568_groups_0, pad = var_568_pad_0, pad_type = var_568_pad_type_0, strides = var_568_strides_0, weight = layers_1_fc2_inlier_module_weight_to_fp16_palettized, x = input_15_cast_fp16)[name = tensor<string, []>("op_568_cast_fp16")];`
298	`tensor<string, []> var_574_pad_type_0 = const()[name = tensor<string, []>("op_574_pad_type_0"), val = tensor<string, []>("valid")];`
299	`tensor<int32, [2]> var_574_strides_0 = const()[name = tensor<string, []>("op_574_strides_0"), val = tensor<int32, [2]>([1, 1])];`
300	`tensor<int32, [4]> var_574_pad_0 = const()[name = tensor<string, []>("op_574_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
301	`tensor<int32, [2]> var_574_dilations_0 = const()[name = tensor<string, []>("op_574_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
302	`tensor<int32, []> var_574_groups_0 = const()[name = tensor<string, []>("op_574_groups_0"), val = tensor<int32, []>(1)];`
303	tensor<fp16, [768, 3072, 1, 1]> layers_1_fc2_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(16225152))), name = tensor<string, []>("layers_1_fc2_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [30100]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(16164864))), shape = tensor<uint32, [4]>([768, 3072, 1, 1])];
304	`tensor<fp16, [1, 768, 1, 1500]> var_574_cast_fp16 = conv(dilations = var_574_dilations_0, groups = var_574_groups_0, pad = var_574_pad_0, pad_type = var_574_pad_type_0, strides = var_574_strides_0, weight = layers_1_fc2_outlier_module_weight_to_fp16_sparsified, x = input_15_cast_fp16)[name = tensor<string, []>("op_574_cast_fp16")];`
305	`tensor<fp16, [1, 768, 1, 1500]> hidden_states_7_cast_fp16 = add(x = var_568_cast_fp16, y = var_574_cast_fp16)[name = tensor<string, []>("hidden_states_7_cast_fp16")];`
306	`tensor<fp16, [1, 768, 1, 1500]> inputs_9_cast_fp16 = add(x = inputs_7_cast_fp16, y = hidden_states_7_cast_fp16)[name = tensor<string, []>("inputs_9_cast_fp16")];`
307	`tensor<int32, []> var_580 = const()[name = tensor<string, []>("op_580"), val = tensor<int32, []>(3)];`
308	`tensor<int32, [1]> out_9_axes_0 = const()[name = tensor<string, []>("out_9_axes_0"), val = tensor<int32, [1]>([1])];`
309	`tensor<fp16, []> var_602_to_fp16 = const()[name = tensor<string, []>("op_602_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
310	`tensor<fp16, [1, 768, 1, 1500]> out_9_cast_fp16 = layer_norm(axes = out_9_axes_0, epsilon = var_602_to_fp16, x = inputs_9_cast_fp16)[name = tensor<string, []>("out_9_cast_fp16")];`
311	`tensor<fp16, [768]> obj_9_gamma_0_to_fp16 = const()[name = tensor<string, []>("obj_9_gamma_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(16520128)))];`
312	`tensor<fp16, [768]> obj_9_beta_0_to_fp16 = const()[name = tensor<string, []>("obj_9_beta_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(16521728)))];`
313	`tensor<fp16, []> obj_9_epsilon_0_to_fp16 = const()[name = tensor<string, []>("obj_9_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
314	`tensor<fp16, [1, 768, 1, 1500]> obj_9_cast_fp16 = batch_norm(beta = obj_9_beta_0_to_fp16, epsilon = obj_9_epsilon_0_to_fp16, gamma = obj_9_gamma_0_to_fp16, mean = var_57_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_9_cast_fp16)[name = tensor<string, []>("obj_9_cast_fp16")];`
315	`tensor<string, []> var_624_pad_type_0 = const()[name = tensor<string, []>("op_624_pad_type_0"), val = tensor<string, []>("valid")];`
316	`tensor<int32, [2]> var_624_strides_0 = const()[name = tensor<string, []>("op_624_strides_0"), val = tensor<int32, [2]>([1, 1])];`
317	`tensor<int32, [4]> var_624_pad_0 = const()[name = tensor<string, []>("op_624_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
318	`tensor<int32, [2]> var_624_dilations_0 = const()[name = tensor<string, []>("op_624_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
319	`tensor<int32, []> var_624_groups_0 = const()[name = tensor<string, []>("op_624_groups_0"), val = tensor<int32, []>(1)];`
320	tensor<fp16, [768, 768, 1, 1]> layers_2_self_attn_q_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(16523328))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(16818304))), name = tensor<string, []>("layers_2_self_attn_q_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
321	`tensor<fp16, [768]> layers_2_self_attn_q_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_2_self_attn_q_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(16818432)))];`
322	`tensor<fp16, [1, 768, 1, 1500]> var_624_cast_fp16 = conv(bias = layers_2_self_attn_q_proj_inlier_module_bias_to_fp16, dilations = var_624_dilations_0, groups = var_624_groups_0, pad = var_624_pad_0, pad_type = var_624_pad_type_0, strides = var_624_strides_0, weight = layers_2_self_attn_q_proj_inlier_module_weight_to_fp16_palettized, x = obj_9_cast_fp16)[name = tensor<string, []>("op_624_cast_fp16")];`
323	`tensor<string, []> var_630_pad_type_0 = const()[name = tensor<string, []>("op_630_pad_type_0"), val = tensor<string, []>("valid")];`
324	`tensor<int32, [2]> var_630_strides_0 = const()[name = tensor<string, []>("op_630_strides_0"), val = tensor<int32, [2]>([1, 1])];`
325	`tensor<int32, [4]> var_630_pad_0 = const()[name = tensor<string, []>("op_630_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
326	`tensor<int32, [2]> var_630_dilations_0 = const()[name = tensor<string, []>("op_630_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
327	`tensor<int32, []> var_630_groups_0 = const()[name = tensor<string, []>("op_630_groups_0"), val = tensor<int32, []>(1)];`
328	tensor<fp16, [768, 768, 1, 1]> layers_2_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(16834112))), name = tensor<string, []>("layers_2_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [6978]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(16820032))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
329	`tensor<fp16, [1, 768, 1, 1500]> var_630_cast_fp16 = conv(dilations = var_630_dilations_0, groups = var_630_groups_0, pad = var_630_pad_0, pad_type = var_630_pad_type_0, strides = var_630_strides_0, weight = layers_2_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified, x = obj_9_cast_fp16)[name = tensor<string, []>("op_630_cast_fp16")];`
330	`tensor<fp16, [1, 768, 1, 1500]> query_5_cast_fp16 = add(x = var_624_cast_fp16, y = var_630_cast_fp16)[name = tensor<string, []>("query_5_cast_fp16")];`
331	`tensor<string, []> var_639_pad_type_0 = const()[name = tensor<string, []>("op_639_pad_type_0"), val = tensor<string, []>("valid")];`
332	`tensor<int32, [2]> var_639_strides_0 = const()[name = tensor<string, []>("op_639_strides_0"), val = tensor<int32, [2]>([1, 1])];`
333	`tensor<int32, [4]> var_639_pad_0 = const()[name = tensor<string, []>("op_639_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
334	`tensor<int32, [2]> var_639_dilations_0 = const()[name = tensor<string, []>("op_639_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
335	`tensor<int32, []> var_639_groups_0 = const()[name = tensor<string, []>("op_639_groups_0"), val = tensor<int32, []>(1)];`
336	tensor<fp16, [768, 768, 1, 1]> layers_2_self_attn_k_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(16907904))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(17202880))), name = tensor<string, []>("layers_2_self_attn_k_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
337	`tensor<fp16, [1, 768, 1, 1500]> var_639_cast_fp16 = conv(dilations = var_639_dilations_0, groups = var_639_groups_0, pad = var_639_pad_0, pad_type = var_639_pad_type_0, strides = var_639_strides_0, weight = layers_2_self_attn_k_proj_inlier_module_weight_to_fp16_palettized, x = obj_9_cast_fp16)[name = tensor<string, []>("op_639_cast_fp16")];`
338	`tensor<string, []> var_645_pad_type_0 = const()[name = tensor<string, []>("op_645_pad_type_0"), val = tensor<string, []>("valid")];`
339	`tensor<int32, [2]> var_645_strides_0 = const()[name = tensor<string, []>("op_645_strides_0"), val = tensor<int32, [2]>([1, 1])];`
340	`tensor<int32, [4]> var_645_pad_0 = const()[name = tensor<string, []>("op_645_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
341	`tensor<int32, [2]> var_645_dilations_0 = const()[name = tensor<string, []>("op_645_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
342	`tensor<int32, []> var_645_groups_0 = const()[name = tensor<string, []>("op_645_groups_0"), val = tensor<int32, []>(1)];`
343	tensor<fp16, [768, 768, 1, 1]> layers_2_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(17216384))), name = tensor<string, []>("layers_2_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [6646]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(17203008))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
344	`tensor<fp16, [1, 768, 1, 1500]> var_645_cast_fp16 = conv(dilations = var_645_dilations_0, groups = var_645_groups_0, pad = var_645_pad_0, pad_type = var_645_pad_type_0, strides = var_645_strides_0, weight = layers_2_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified, x = obj_9_cast_fp16)[name = tensor<string, []>("op_645_cast_fp16")];`
345	`tensor<fp16, [1, 768, 1, 1500]> key_5_cast_fp16 = add(x = var_639_cast_fp16, y = var_645_cast_fp16)[name = tensor<string, []>("key_5_cast_fp16")];`
346	`tensor<string, []> var_655_pad_type_0 = const()[name = tensor<string, []>("op_655_pad_type_0"), val = tensor<string, []>("valid")];`
347	`tensor<int32, [2]> var_655_strides_0 = const()[name = tensor<string, []>("op_655_strides_0"), val = tensor<int32, [2]>([1, 1])];`
348	`tensor<int32, [4]> var_655_pad_0 = const()[name = tensor<string, []>("op_655_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
349	`tensor<int32, [2]> var_655_dilations_0 = const()[name = tensor<string, []>("op_655_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
350	`tensor<int32, []> var_655_groups_0 = const()[name = tensor<string, []>("op_655_groups_0"), val = tensor<int32, []>(1)];`
351	tensor<fp16, [768, 768, 1, 1]> layers_2_self_attn_v_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(17290176))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(17585152))), name = tensor<string, []>("layers_2_self_attn_v_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
352	`tensor<fp16, [768]> layers_2_self_attn_v_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_2_self_attn_v_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(17585280)))];`
353	`tensor<fp16, [1, 768, 1, 1500]> var_655_cast_fp16 = conv(bias = layers_2_self_attn_v_proj_inlier_module_bias_to_fp16, dilations = var_655_dilations_0, groups = var_655_groups_0, pad = var_655_pad_0, pad_type = var_655_pad_type_0, strides = var_655_strides_0, weight = layers_2_self_attn_v_proj_inlier_module_weight_to_fp16_palettized, x = obj_9_cast_fp16)[name = tensor<string, []>("op_655_cast_fp16")];`
354	`tensor<string, []> var_661_pad_type_0 = const()[name = tensor<string, []>("op_661_pad_type_0"), val = tensor<string, []>("valid")];`
355	`tensor<int32, [2]> var_661_strides_0 = const()[name = tensor<string, []>("op_661_strides_0"), val = tensor<int32, [2]>([1, 1])];`
356	`tensor<int32, [4]> var_661_pad_0 = const()[name = tensor<string, []>("op_661_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
357	`tensor<int32, [2]> var_661_dilations_0 = const()[name = tensor<string, []>("op_661_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
358	`tensor<int32, []> var_661_groups_0 = const()[name = tensor<string, []>("op_661_groups_0"), val = tensor<int32, []>(1)];`
359	tensor<fp16, [768, 768, 1, 1]> layers_2_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(17596992))), name = tensor<string, []>("layers_2_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [5006]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(17586880))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
360	`tensor<fp16, [1, 768, 1, 1500]> var_661_cast_fp16 = conv(dilations = var_661_dilations_0, groups = var_661_groups_0, pad = var_661_pad_0, pad_type = var_661_pad_type_0, strides = var_661_strides_0, weight = layers_2_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified, x = obj_9_cast_fp16)[name = tensor<string, []>("op_661_cast_fp16")];`
361	`tensor<fp16, [1, 768, 1, 1500]> value_5_cast_fp16 = add(x = var_655_cast_fp16, y = var_661_cast_fp16)[name = tensor<string, []>("value_5_cast_fp16")];`
362	`tensor<int32, [4]> var_665 = const()[name = tensor<string, []>("op_665"), val = tensor<int32, [4]>([1, 12, 64, 1500])];`
363	`tensor<fp16, [1, 12, 64, 1500]> mh_q_5_cast_fp16 = reshape(shape = var_665, x = query_5_cast_fp16)[name = tensor<string, []>("mh_q_5_cast_fp16")];`
364	`tensor<fp16, []> var_667_to_fp16 = const()[name = tensor<string, []>("op_667_to_fp16"), val = tensor<fp16, []>(0x1p-3)];`
365	`tensor<fp16, [1, 12, 64, 1500]> var_668_cast_fp16 = mul(x = mh_q_5_cast_fp16, y = var_667_to_fp16)[name = tensor<string, []>("op_668_cast_fp16")];`
366	`tensor<int32, [4]> var_671 = const()[name = tensor<string, []>("op_671"), val = tensor<int32, [4]>([1, 12, 64, 1500])];`
367	`tensor<fp16, [1, 12, 64, 1500]> var_672_cast_fp16 = reshape(shape = var_671, x = key_5_cast_fp16)[name = tensor<string, []>("op_672_cast_fp16")];`
368	`tensor<bool, []> mh_w_5_transpose_x_0 = const()[name = tensor<string, []>("mh_w_5_transpose_x_0"), val = tensor<bool, []>(true)];`
369	`tensor<bool, []> mh_w_5_transpose_y_0 = const()[name = tensor<string, []>("mh_w_5_transpose_y_0"), val = tensor<bool, []>(false)];`
370	`tensor<fp16, [1, 12, 1500, 1500]> mh_w_5_cast_fp16 = matmul(transpose_x = mh_w_5_transpose_x_0, transpose_y = mh_w_5_transpose_y_0, x = var_668_cast_fp16, y = var_672_cast_fp16)[name = tensor<string, []>("mh_w_5_cast_fp16")];`
371	`tensor<fp16, [1, 12, 1500, 1500]> var_675_cast_fp16 = softmax(axis = var_580, x = mh_w_5_cast_fp16)[name = tensor<string, []>("op_675_cast_fp16")];`
372	`tensor<int32, [4]> var_676 = const()[name = tensor<string, []>("op_676"), val = tensor<int32, [4]>([1, 12, 64, 1500])];`
373	`tensor<fp16, [1, 12, 64, 1500]> var_677_cast_fp16 = reshape(shape = var_676, x = value_5_cast_fp16)[name = tensor<string, []>("op_677_cast_fp16")];`
374	`tensor<bool, []> attn_5_transpose_x_0 = const()[name = tensor<string, []>("attn_5_transpose_x_0"), val = tensor<bool, []>(false)];`
375	`tensor<bool, []> attn_5_transpose_y_0 = const()[name = tensor<string, []>("attn_5_transpose_y_0"), val = tensor<bool, []>(true)];`
376	`tensor<fp16, [1, 12, 64, 1500]> attn_5_cast_fp16 = matmul(transpose_x = attn_5_transpose_x_0, transpose_y = attn_5_transpose_y_0, x = var_677_cast_fp16, y = var_675_cast_fp16)[name = tensor<string, []>("attn_5_cast_fp16")];`
377	`tensor<int32, [4]> var_680 = const()[name = tensor<string, []>("op_680"), val = tensor<int32, [4]>([1, 768, 1, 1500])];`
378	`tensor<fp16, [1, 768, 1, 1500]> input_17_cast_fp16 = reshape(shape = var_680, x = attn_5_cast_fp16)[name = tensor<string, []>("input_17_cast_fp16")];`
379	`tensor<string, []> var_690_pad_type_0 = const()[name = tensor<string, []>("op_690_pad_type_0"), val = tensor<string, []>("valid")];`
380	`tensor<int32, [2]> var_690_strides_0 = const()[name = tensor<string, []>("op_690_strides_0"), val = tensor<int32, [2]>([1, 1])];`
381	`tensor<int32, [4]> var_690_pad_0 = const()[name = tensor<string, []>("op_690_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
382	`tensor<int32, [2]> var_690_dilations_0 = const()[name = tensor<string, []>("op_690_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
383	`tensor<int32, []> var_690_groups_0 = const()[name = tensor<string, []>("op_690_groups_0"), val = tensor<int32, []>(1)];`
384	tensor<fp16, [768, 768, 1, 1]> layers_2_self_attn_o_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(17670784))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(17965760))), name = tensor<string, []>("layers_2_self_attn_o_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
385	`tensor<fp16, [768]> layers_2_self_attn_o_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_2_self_attn_o_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(17965888)))];`
386	`tensor<fp16, [1, 768, 1, 1500]> var_690_cast_fp16 = conv(bias = layers_2_self_attn_o_proj_inlier_module_bias_to_fp16, dilations = var_690_dilations_0, groups = var_690_groups_0, pad = var_690_pad_0, pad_type = var_690_pad_type_0, strides = var_690_strides_0, weight = layers_2_self_attn_o_proj_inlier_module_weight_to_fp16_palettized, x = input_17_cast_fp16)[name = tensor<string, []>("op_690_cast_fp16")];`
387	`tensor<string, []> var_696_pad_type_0 = const()[name = tensor<string, []>("op_696_pad_type_0"), val = tensor<string, []>("valid")];`
388	`tensor<int32, [2]> var_696_strides_0 = const()[name = tensor<string, []>("op_696_strides_0"), val = tensor<int32, [2]>([1, 1])];`
389	`tensor<int32, [4]> var_696_pad_0 = const()[name = tensor<string, []>("op_696_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
390	`tensor<int32, [2]> var_696_dilations_0 = const()[name = tensor<string, []>("op_696_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
391	`tensor<int32, []> var_696_groups_0 = const()[name = tensor<string, []>("op_696_groups_0"), val = tensor<int32, []>(1)];`
392	tensor<fp16, [768, 768, 1, 1]> layers_2_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(17976064))), name = tensor<string, []>("layers_2_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [4255]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(17967488))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
393	`tensor<fp16, [1, 768, 1, 1500]> var_696_cast_fp16 = conv(dilations = var_696_dilations_0, groups = var_696_groups_0, pad = var_696_pad_0, pad_type = var_696_pad_type_0, strides = var_696_strides_0, weight = layers_2_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified, x = input_17_cast_fp16)[name = tensor<string, []>("op_696_cast_fp16")];`
394	`tensor<fp16, [1, 768, 1, 1500]> obj_11_cast_fp16 = add(x = var_690_cast_fp16, y = var_696_cast_fp16)[name = tensor<string, []>("obj_11_cast_fp16")];`
395	`tensor<fp16, [1, 768, 1, 1500]> inputs_11_cast_fp16 = add(x = inputs_9_cast_fp16, y = obj_11_cast_fp16)[name = tensor<string, []>("inputs_11_cast_fp16")];`
396	`tensor<int32, [1]> out_11_axes_0 = const()[name = tensor<string, []>("out_11_axes_0"), val = tensor<int32, [1]>([1])];`
397	`tensor<fp16, []> var_707_to_fp16 = const()[name = tensor<string, []>("op_707_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
398	`tensor<fp16, [1, 768, 1, 1500]> out_11_cast_fp16 = layer_norm(axes = out_11_axes_0, epsilon = var_707_to_fp16, x = inputs_11_cast_fp16)[name = tensor<string, []>("out_11_cast_fp16")];`
399	`tensor<fp16, [768]> input_19_gamma_0_to_fp16 = const()[name = tensor<string, []>("input_19_gamma_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(18049856)))];`
400	`tensor<fp16, [768]> input_19_beta_0_to_fp16 = const()[name = tensor<string, []>("input_19_beta_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(18051456)))];`
401	`tensor<fp16, []> input_19_epsilon_0_to_fp16 = const()[name = tensor<string, []>("input_19_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
402	`tensor<fp16, [1, 768, 1, 1500]> input_19_cast_fp16 = batch_norm(beta = input_19_beta_0_to_fp16, epsilon = input_19_epsilon_0_to_fp16, gamma = input_19_gamma_0_to_fp16, mean = var_57_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_11_cast_fp16)[name = tensor<string, []>("input_19_cast_fp16")];`
403	`tensor<string, []> var_725_pad_type_0 = const()[name = tensor<string, []>("op_725_pad_type_0"), val = tensor<string, []>("valid")];`
404	`tensor<int32, [2]> var_725_strides_0 = const()[name = tensor<string, []>("op_725_strides_0"), val = tensor<int32, [2]>([1, 1])];`
405	`tensor<int32, [4]> var_725_pad_0 = const()[name = tensor<string, []>("op_725_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
406	`tensor<int32, [2]> var_725_dilations_0 = const()[name = tensor<string, []>("op_725_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
407	`tensor<int32, []> var_725_groups_0 = const()[name = tensor<string, []>("op_725_groups_0"), val = tensor<int32, []>(1)];`
408	tensor<fp16, [3072, 768, 1, 1]> layers_2_fc1_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [1179648]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(18053056))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(19232768))), name = tensor<string, []>("layers_2_fc1_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([3072, 768, 1, 1])];
409	`tensor<fp16, [3072]> layers_2_fc1_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_2_fc1_inlier_module_bias_to_fp16"), val = tensor<fp16, [3072]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(19232896)))];`
410	`tensor<fp16, [1, 3072, 1, 1500]> var_725_cast_fp16 = conv(bias = layers_2_fc1_inlier_module_bias_to_fp16, dilations = var_725_dilations_0, groups = var_725_groups_0, pad = var_725_pad_0, pad_type = var_725_pad_type_0, strides = var_725_strides_0, weight = layers_2_fc1_inlier_module_weight_to_fp16_palettized, x = input_19_cast_fp16)[name = tensor<string, []>("op_725_cast_fp16")];`
411	`tensor<string, []> var_731_pad_type_0 = const()[name = tensor<string, []>("op_731_pad_type_0"), val = tensor<string, []>("valid")];`
412	`tensor<int32, [2]> var_731_strides_0 = const()[name = tensor<string, []>("op_731_strides_0"), val = tensor<int32, [2]>([1, 1])];`
413	`tensor<int32, [4]> var_731_pad_0 = const()[name = tensor<string, []>("op_731_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
414	`tensor<int32, [2]> var_731_dilations_0 = const()[name = tensor<string, []>("op_731_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
415	`tensor<int32, []> var_731_groups_0 = const()[name = tensor<string, []>("op_731_groups_0"), val = tensor<int32, []>(1)];`
416	tensor<fp16, [3072, 768, 1, 1]> layers_2_fc1_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(19298752))), name = tensor<string, []>("layers_2_fc1_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [29780]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(19239104))), shape = tensor<uint32, [4]>([3072, 768, 1, 1])];
417	`tensor<fp16, [1, 3072, 1, 1500]> var_731_cast_fp16 = conv(dilations = var_731_dilations_0, groups = var_731_groups_0, pad = var_731_pad_0, pad_type = var_731_pad_type_0, strides = var_731_strides_0, weight = layers_2_fc1_outlier_module_weight_to_fp16_sparsified, x = input_19_cast_fp16)[name = tensor<string, []>("op_731_cast_fp16")];`
418	`tensor<fp16, [1, 3072, 1, 1500]> input_21_cast_fp16 = add(x = var_725_cast_fp16, y = var_731_cast_fp16)[name = tensor<string, []>("input_21_cast_fp16")];`
419	`tensor<string, []> input_23_mode_0 = const()[name = tensor<string, []>("input_23_mode_0"), val = tensor<string, []>("EXACT")];`
420	`tensor<fp16, [1, 3072, 1, 1500]> input_23_cast_fp16 = gelu(mode = input_23_mode_0, x = input_21_cast_fp16)[name = tensor<string, []>("input_23_cast_fp16")];`
421	`tensor<string, []> var_742_pad_type_0 = const()[name = tensor<string, []>("op_742_pad_type_0"), val = tensor<string, []>("valid")];`
422	`tensor<int32, [2]> var_742_strides_0 = const()[name = tensor<string, []>("op_742_strides_0"), val = tensor<int32, [2]>([1, 1])];`
423	`tensor<int32, [4]> var_742_pad_0 = const()[name = tensor<string, []>("op_742_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
424	`tensor<int32, [2]> var_742_dilations_0 = const()[name = tensor<string, []>("op_742_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
425	`tensor<int32, []> var_742_groups_0 = const()[name = tensor<string, []>("op_742_groups_0"), val = tensor<int32, []>(1)];`
426	tensor<fp16, [768, 3072, 1, 1]> layers_2_fc2_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [1179648]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(19593728))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(20773440))), name = tensor<string, []>("layers_2_fc2_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 3072, 1, 1])];
427	`tensor<fp16, [768]> layers_2_fc2_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_2_fc2_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(20773568)))];`
428	`tensor<fp16, [1, 768, 1, 1500]> var_742_cast_fp16 = conv(bias = layers_2_fc2_inlier_module_bias_to_fp16, dilations = var_742_dilations_0, groups = var_742_groups_0, pad = var_742_pad_0, pad_type = var_742_pad_type_0, strides = var_742_strides_0, weight = layers_2_fc2_inlier_module_weight_to_fp16_palettized, x = input_23_cast_fp16)[name = tensor<string, []>("op_742_cast_fp16")];`
429	`tensor<string, []> var_748_pad_type_0 = const()[name = tensor<string, []>("op_748_pad_type_0"), val = tensor<string, []>("valid")];`
430	`tensor<int32, [2]> var_748_strides_0 = const()[name = tensor<string, []>("op_748_strides_0"), val = tensor<int32, [2]>([1, 1])];`
431	`tensor<int32, [4]> var_748_pad_0 = const()[name = tensor<string, []>("op_748_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
432	`tensor<int32, [2]> var_748_dilations_0 = const()[name = tensor<string, []>("op_748_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
433	`tensor<int32, []> var_748_groups_0 = const()[name = tensor<string, []>("op_748_groups_0"), val = tensor<int32, []>(1)];`
434	tensor<fp16, [768, 3072, 1, 1]> layers_2_fc2_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(20834944))), name = tensor<string, []>("layers_2_fc2_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [29841]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(20775168))), shape = tensor<uint32, [4]>([768, 3072, 1, 1])];
435	`tensor<fp16, [1, 768, 1, 1500]> var_748_cast_fp16 = conv(dilations = var_748_dilations_0, groups = var_748_groups_0, pad = var_748_pad_0, pad_type = var_748_pad_type_0, strides = var_748_strides_0, weight = layers_2_fc2_outlier_module_weight_to_fp16_sparsified, x = input_23_cast_fp16)[name = tensor<string, []>("op_748_cast_fp16")];`
436	`tensor<fp16, [1, 768, 1, 1500]> hidden_states_9_cast_fp16 = add(x = var_742_cast_fp16, y = var_748_cast_fp16)[name = tensor<string, []>("hidden_states_9_cast_fp16")];`
437	`tensor<fp16, [1, 768, 1, 1500]> inputs_13_cast_fp16 = add(x = inputs_11_cast_fp16, y = hidden_states_9_cast_fp16)[name = tensor<string, []>("inputs_13_cast_fp16")];`
438	`tensor<int32, []> var_754 = const()[name = tensor<string, []>("op_754"), val = tensor<int32, []>(3)];`
439	`tensor<int32, [1]> out_13_axes_0 = const()[name = tensor<string, []>("out_13_axes_0"), val = tensor<int32, [1]>([1])];`
440	`tensor<fp16, []> var_776_to_fp16 = const()[name = tensor<string, []>("op_776_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
441	`tensor<fp16, [1, 768, 1, 1500]> out_13_cast_fp16 = layer_norm(axes = out_13_axes_0, epsilon = var_776_to_fp16, x = inputs_13_cast_fp16)[name = tensor<string, []>("out_13_cast_fp16")];`
442	`tensor<fp16, [768]> obj_13_gamma_0_to_fp16 = const()[name = tensor<string, []>("obj_13_gamma_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(21129920)))];`
443	`tensor<fp16, [768]> obj_13_beta_0_to_fp16 = const()[name = tensor<string, []>("obj_13_beta_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(21131520)))];`
444	`tensor<fp16, []> obj_13_epsilon_0_to_fp16 = const()[name = tensor<string, []>("obj_13_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
445	`tensor<fp16, [1, 768, 1, 1500]> obj_13_cast_fp16 = batch_norm(beta = obj_13_beta_0_to_fp16, epsilon = obj_13_epsilon_0_to_fp16, gamma = obj_13_gamma_0_to_fp16, mean = var_57_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_13_cast_fp16)[name = tensor<string, []>("obj_13_cast_fp16")];`
446	`tensor<string, []> var_798_pad_type_0 = const()[name = tensor<string, []>("op_798_pad_type_0"), val = tensor<string, []>("valid")];`
447	`tensor<int32, [2]> var_798_strides_0 = const()[name = tensor<string, []>("op_798_strides_0"), val = tensor<int32, [2]>([1, 1])];`
448	`tensor<int32, [4]> var_798_pad_0 = const()[name = tensor<string, []>("op_798_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
449	`tensor<int32, [2]> var_798_dilations_0 = const()[name = tensor<string, []>("op_798_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
450	`tensor<int32, []> var_798_groups_0 = const()[name = tensor<string, []>("op_798_groups_0"), val = tensor<int32, []>(1)];`
451	tensor<fp16, [768, 768, 1, 1]> layers_3_self_attn_q_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(21133120))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(21428096))), name = tensor<string, []>("layers_3_self_attn_q_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
452	`tensor<fp16, [768]> layers_3_self_attn_q_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_3_self_attn_q_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(21428224)))];`
453	`tensor<fp16, [1, 768, 1, 1500]> var_798_cast_fp16 = conv(bias = layers_3_self_attn_q_proj_inlier_module_bias_to_fp16, dilations = var_798_dilations_0, groups = var_798_groups_0, pad = var_798_pad_0, pad_type = var_798_pad_type_0, strides = var_798_strides_0, weight = layers_3_self_attn_q_proj_inlier_module_weight_to_fp16_palettized, x = obj_13_cast_fp16)[name = tensor<string, []>("op_798_cast_fp16")];`
454	`tensor<string, []> var_804_pad_type_0 = const()[name = tensor<string, []>("op_804_pad_type_0"), val = tensor<string, []>("valid")];`
455	`tensor<int32, [2]> var_804_strides_0 = const()[name = tensor<string, []>("op_804_strides_0"), val = tensor<int32, [2]>([1, 1])];`
456	`tensor<int32, [4]> var_804_pad_0 = const()[name = tensor<string, []>("op_804_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
457	`tensor<int32, [2]> var_804_dilations_0 = const()[name = tensor<string, []>("op_804_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
458	`tensor<int32, []> var_804_groups_0 = const()[name = tensor<string, []>("op_804_groups_0"), val = tensor<int32, []>(1)];`
459	tensor<fp16, [768, 768, 1, 1]> layers_3_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(21440384))), name = tensor<string, []>("layers_3_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [5218]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(21429824))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
460	`tensor<fp16, [1, 768, 1, 1500]> var_804_cast_fp16 = conv(dilations = var_804_dilations_0, groups = var_804_groups_0, pad = var_804_pad_0, pad_type = var_804_pad_type_0, strides = var_804_strides_0, weight = layers_3_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified, x = obj_13_cast_fp16)[name = tensor<string, []>("op_804_cast_fp16")];`
461	`tensor<fp16, [1, 768, 1, 1500]> query_7_cast_fp16 = add(x = var_798_cast_fp16, y = var_804_cast_fp16)[name = tensor<string, []>("query_7_cast_fp16")];`
462	`tensor<string, []> var_813_pad_type_0 = const()[name = tensor<string, []>("op_813_pad_type_0"), val = tensor<string, []>("valid")];`
463	`tensor<int32, [2]> var_813_strides_0 = const()[name = tensor<string, []>("op_813_strides_0"), val = tensor<int32, [2]>([1, 1])];`
464	`tensor<int32, [4]> var_813_pad_0 = const()[name = tensor<string, []>("op_813_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
465	`tensor<int32, [2]> var_813_dilations_0 = const()[name = tensor<string, []>("op_813_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
466	`tensor<int32, []> var_813_groups_0 = const()[name = tensor<string, []>("op_813_groups_0"), val = tensor<int32, []>(1)];`
467	tensor<fp16, [768, 768, 1, 1]> layers_3_self_attn_k_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(21514176))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(21809152))), name = tensor<string, []>("layers_3_self_attn_k_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
468	`tensor<fp16, [1, 768, 1, 1500]> var_813_cast_fp16 = conv(dilations = var_813_dilations_0, groups = var_813_groups_0, pad = var_813_pad_0, pad_type = var_813_pad_type_0, strides = var_813_strides_0, weight = layers_3_self_attn_k_proj_inlier_module_weight_to_fp16_palettized, x = obj_13_cast_fp16)[name = tensor<string, []>("op_813_cast_fp16")];`
469	`tensor<string, []> var_819_pad_type_0 = const()[name = tensor<string, []>("op_819_pad_type_0"), val = tensor<string, []>("valid")];`
470	`tensor<int32, [2]> var_819_strides_0 = const()[name = tensor<string, []>("op_819_strides_0"), val = tensor<int32, [2]>([1, 1])];`
471	`tensor<int32, [4]> var_819_pad_0 = const()[name = tensor<string, []>("op_819_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
472	`tensor<int32, [2]> var_819_dilations_0 = const()[name = tensor<string, []>("op_819_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
473	`tensor<int32, []> var_819_groups_0 = const()[name = tensor<string, []>("op_819_groups_0"), val = tensor<int32, []>(1)];`
474	tensor<fp16, [768, 768, 1, 1]> layers_3_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(21819776))), name = tensor<string, []>("layers_3_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [5203]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(21809280))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
475	`tensor<fp16, [1, 768, 1, 1500]> var_819_cast_fp16 = conv(dilations = var_819_dilations_0, groups = var_819_groups_0, pad = var_819_pad_0, pad_type = var_819_pad_type_0, strides = var_819_strides_0, weight = layers_3_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified, x = obj_13_cast_fp16)[name = tensor<string, []>("op_819_cast_fp16")];`
476	`tensor<fp16, [1, 768, 1, 1500]> key_7_cast_fp16 = add(x = var_813_cast_fp16, y = var_819_cast_fp16)[name = tensor<string, []>("key_7_cast_fp16")];`
477	`tensor<string, []> var_829_pad_type_0 = const()[name = tensor<string, []>("op_829_pad_type_0"), val = tensor<string, []>("valid")];`
478	`tensor<int32, [2]> var_829_strides_0 = const()[name = tensor<string, []>("op_829_strides_0"), val = tensor<int32, [2]>([1, 1])];`
479	`tensor<int32, [4]> var_829_pad_0 = const()[name = tensor<string, []>("op_829_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
480	`tensor<int32, [2]> var_829_dilations_0 = const()[name = tensor<string, []>("op_829_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
481	`tensor<int32, []> var_829_groups_0 = const()[name = tensor<string, []>("op_829_groups_0"), val = tensor<int32, []>(1)];`
482	tensor<fp16, [768, 768, 1, 1]> layers_3_self_attn_v_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(21893568))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(22188544))), name = tensor<string, []>("layers_3_self_attn_v_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
483	`tensor<fp16, [768]> layers_3_self_attn_v_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_3_self_attn_v_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(22188672)))];`
484	`tensor<fp16, [1, 768, 1, 1500]> var_829_cast_fp16 = conv(bias = layers_3_self_attn_v_proj_inlier_module_bias_to_fp16, dilations = var_829_dilations_0, groups = var_829_groups_0, pad = var_829_pad_0, pad_type = var_829_pad_type_0, strides = var_829_strides_0, weight = layers_3_self_attn_v_proj_inlier_module_weight_to_fp16_palettized, x = obj_13_cast_fp16)[name = tensor<string, []>("op_829_cast_fp16")];`
485	`tensor<string, []> var_835_pad_type_0 = const()[name = tensor<string, []>("op_835_pad_type_0"), val = tensor<string, []>("valid")];`
486	`tensor<int32, [2]> var_835_strides_0 = const()[name = tensor<string, []>("op_835_strides_0"), val = tensor<int32, [2]>([1, 1])];`
487	`tensor<int32, [4]> var_835_pad_0 = const()[name = tensor<string, []>("op_835_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
488	`tensor<int32, [2]> var_835_dilations_0 = const()[name = tensor<string, []>("op_835_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
489	`tensor<int32, []> var_835_groups_0 = const()[name = tensor<string, []>("op_835_groups_0"), val = tensor<int32, []>(1)];`
490	tensor<fp16, [768, 768, 1, 1]> layers_3_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(22198784))), name = tensor<string, []>("layers_3_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [4222]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(22190272))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
491	`tensor<fp16, [1, 768, 1, 1500]> var_835_cast_fp16 = conv(dilations = var_835_dilations_0, groups = var_835_groups_0, pad = var_835_pad_0, pad_type = var_835_pad_type_0, strides = var_835_strides_0, weight = layers_3_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified, x = obj_13_cast_fp16)[name = tensor<string, []>("op_835_cast_fp16")];`
492	`tensor<fp16, [1, 768, 1, 1500]> value_7_cast_fp16 = add(x = var_829_cast_fp16, y = var_835_cast_fp16)[name = tensor<string, []>("value_7_cast_fp16")];`
493	`tensor<int32, [4]> var_839 = const()[name = tensor<string, []>("op_839"), val = tensor<int32, [4]>([1, 12, 64, 1500])];`
494	`tensor<fp16, [1, 12, 64, 1500]> mh_q_7_cast_fp16 = reshape(shape = var_839, x = query_7_cast_fp16)[name = tensor<string, []>("mh_q_7_cast_fp16")];`
495	`tensor<fp16, []> var_841_to_fp16 = const()[name = tensor<string, []>("op_841_to_fp16"), val = tensor<fp16, []>(0x1p-3)];`
496	`tensor<fp16, [1, 12, 64, 1500]> var_842_cast_fp16 = mul(x = mh_q_7_cast_fp16, y = var_841_to_fp16)[name = tensor<string, []>("op_842_cast_fp16")];`
497	`tensor<int32, [4]> var_845 = const()[name = tensor<string, []>("op_845"), val = tensor<int32, [4]>([1, 12, 64, 1500])];`
498	`tensor<fp16, [1, 12, 64, 1500]> var_846_cast_fp16 = reshape(shape = var_845, x = key_7_cast_fp16)[name = tensor<string, []>("op_846_cast_fp16")];`
499	`tensor<bool, []> mh_w_7_transpose_x_0 = const()[name = tensor<string, []>("mh_w_7_transpose_x_0"), val = tensor<bool, []>(true)];`
500	`tensor<bool, []> mh_w_7_transpose_y_0 = const()[name = tensor<string, []>("mh_w_7_transpose_y_0"), val = tensor<bool, []>(false)];`
501	`tensor<fp16, [1, 12, 1500, 1500]> mh_w_7_cast_fp16 = matmul(transpose_x = mh_w_7_transpose_x_0, transpose_y = mh_w_7_transpose_y_0, x = var_842_cast_fp16, y = var_846_cast_fp16)[name = tensor<string, []>("mh_w_7_cast_fp16")];`
502	`tensor<fp16, [1, 12, 1500, 1500]> var_849_cast_fp16 = softmax(axis = var_754, x = mh_w_7_cast_fp16)[name = tensor<string, []>("op_849_cast_fp16")];`
503	`tensor<int32, [4]> var_850 = const()[name = tensor<string, []>("op_850"), val = tensor<int32, [4]>([1, 12, 64, 1500])];`
504	`tensor<fp16, [1, 12, 64, 1500]> var_851_cast_fp16 = reshape(shape = var_850, x = value_7_cast_fp16)[name = tensor<string, []>("op_851_cast_fp16")];`
505	`tensor<bool, []> attn_7_transpose_x_0 = const()[name = tensor<string, []>("attn_7_transpose_x_0"), val = tensor<bool, []>(false)];`
506	`tensor<bool, []> attn_7_transpose_y_0 = const()[name = tensor<string, []>("attn_7_transpose_y_0"), val = tensor<bool, []>(true)];`
507	`tensor<fp16, [1, 12, 64, 1500]> attn_7_cast_fp16 = matmul(transpose_x = attn_7_transpose_x_0, transpose_y = attn_7_transpose_y_0, x = var_851_cast_fp16, y = var_849_cast_fp16)[name = tensor<string, []>("attn_7_cast_fp16")];`
508	`tensor<int32, [4]> var_854 = const()[name = tensor<string, []>("op_854"), val = tensor<int32, [4]>([1, 768, 1, 1500])];`
509	`tensor<fp16, [1, 768, 1, 1500]> input_25_cast_fp16 = reshape(shape = var_854, x = attn_7_cast_fp16)[name = tensor<string, []>("input_25_cast_fp16")];`
510	`tensor<string, []> var_864_pad_type_0 = const()[name = tensor<string, []>("op_864_pad_type_0"), val = tensor<string, []>("valid")];`
511	`tensor<int32, [2]> var_864_strides_0 = const()[name = tensor<string, []>("op_864_strides_0"), val = tensor<int32, [2]>([1, 1])];`
512	`tensor<int32, [4]> var_864_pad_0 = const()[name = tensor<string, []>("op_864_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
513	`tensor<int32, [2]> var_864_dilations_0 = const()[name = tensor<string, []>("op_864_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
514	`tensor<int32, []> var_864_groups_0 = const()[name = tensor<string, []>("op_864_groups_0"), val = tensor<int32, []>(1)];`
515	tensor<fp16, [768, 768, 1, 1]> layers_3_self_attn_o_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(22272576))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(22567552))), name = tensor<string, []>("layers_3_self_attn_o_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
516	`tensor<fp16, [768]> layers_3_self_attn_o_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_3_self_attn_o_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(22567680)))];`
517	`tensor<fp16, [1, 768, 1, 1500]> var_864_cast_fp16 = conv(bias = layers_3_self_attn_o_proj_inlier_module_bias_to_fp16, dilations = var_864_dilations_0, groups = var_864_groups_0, pad = var_864_pad_0, pad_type = var_864_pad_type_0, strides = var_864_strides_0, weight = layers_3_self_attn_o_proj_inlier_module_weight_to_fp16_palettized, x = input_25_cast_fp16)[name = tensor<string, []>("op_864_cast_fp16")];`
518	`tensor<string, []> var_870_pad_type_0 = const()[name = tensor<string, []>("op_870_pad_type_0"), val = tensor<string, []>("valid")];`
519	`tensor<int32, [2]> var_870_strides_0 = const()[name = tensor<string, []>("op_870_strides_0"), val = tensor<int32, [2]>([1, 1])];`
520	`tensor<int32, [4]> var_870_pad_0 = const()[name = tensor<string, []>("op_870_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
521	`tensor<int32, [2]> var_870_dilations_0 = const()[name = tensor<string, []>("op_870_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
522	`tensor<int32, []> var_870_groups_0 = const()[name = tensor<string, []>("op_870_groups_0"), val = tensor<int32, []>(1)];`
523	tensor<fp16, [768, 768, 1, 1]> layers_3_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(22576640))), name = tensor<string, []>("layers_3_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [3641]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(22569280))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
524	`tensor<fp16, [1, 768, 1, 1500]> var_870_cast_fp16 = conv(dilations = var_870_dilations_0, groups = var_870_groups_0, pad = var_870_pad_0, pad_type = var_870_pad_type_0, strides = var_870_strides_0, weight = layers_3_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified, x = input_25_cast_fp16)[name = tensor<string, []>("op_870_cast_fp16")];`
525	`tensor<fp16, [1, 768, 1, 1500]> obj_15_cast_fp16 = add(x = var_864_cast_fp16, y = var_870_cast_fp16)[name = tensor<string, []>("obj_15_cast_fp16")];`
526	`tensor<fp16, [1, 768, 1, 1500]> inputs_15_cast_fp16 = add(x = inputs_13_cast_fp16, y = obj_15_cast_fp16)[name = tensor<string, []>("inputs_15_cast_fp16")];`
527	`tensor<int32, [1]> out_15_axes_0 = const()[name = tensor<string, []>("out_15_axes_0"), val = tensor<int32, [1]>([1])];`
528	`tensor<fp16, []> var_881_to_fp16 = const()[name = tensor<string, []>("op_881_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
529	`tensor<fp16, [1, 768, 1, 1500]> out_15_cast_fp16 = layer_norm(axes = out_15_axes_0, epsilon = var_881_to_fp16, x = inputs_15_cast_fp16)[name = tensor<string, []>("out_15_cast_fp16")];`
530	`tensor<fp16, [768]> input_27_gamma_0_to_fp16 = const()[name = tensor<string, []>("input_27_gamma_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(22650432)))];`
531	`tensor<fp16, [768]> input_27_beta_0_to_fp16 = const()[name = tensor<string, []>("input_27_beta_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(22652032)))];`
532	`tensor<fp16, []> input_27_epsilon_0_to_fp16 = const()[name = tensor<string, []>("input_27_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
533	`tensor<fp16, [1, 768, 1, 1500]> input_27_cast_fp16 = batch_norm(beta = input_27_beta_0_to_fp16, epsilon = input_27_epsilon_0_to_fp16, gamma = input_27_gamma_0_to_fp16, mean = var_57_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_15_cast_fp16)[name = tensor<string, []>("input_27_cast_fp16")];`
534	`tensor<string, []> var_899_pad_type_0 = const()[name = tensor<string, []>("op_899_pad_type_0"), val = tensor<string, []>("valid")];`
535	`tensor<int32, [2]> var_899_strides_0 = const()[name = tensor<string, []>("op_899_strides_0"), val = tensor<int32, [2]>([1, 1])];`
536	`tensor<int32, [4]> var_899_pad_0 = const()[name = tensor<string, []>("op_899_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
537	`tensor<int32, [2]> var_899_dilations_0 = const()[name = tensor<string, []>("op_899_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
538	`tensor<int32, []> var_899_groups_0 = const()[name = tensor<string, []>("op_899_groups_0"), val = tensor<int32, []>(1)];`
539	tensor<fp16, [3072, 768, 1, 1]> layers_3_fc1_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [1179648]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(22653632))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(23833344))), name = tensor<string, []>("layers_3_fc1_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([3072, 768, 1, 1])];
540	`tensor<fp16, [3072]> layers_3_fc1_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_3_fc1_inlier_module_bias_to_fp16"), val = tensor<fp16, [3072]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(23833472)))];`
541	`tensor<fp16, [1, 3072, 1, 1500]> var_899_cast_fp16 = conv(bias = layers_3_fc1_inlier_module_bias_to_fp16, dilations = var_899_dilations_0, groups = var_899_groups_0, pad = var_899_pad_0, pad_type = var_899_pad_type_0, strides = var_899_strides_0, weight = layers_3_fc1_inlier_module_weight_to_fp16_palettized, x = input_27_cast_fp16)[name = tensor<string, []>("op_899_cast_fp16")];`
542	`tensor<string, []> var_905_pad_type_0 = const()[name = tensor<string, []>("op_905_pad_type_0"), val = tensor<string, []>("valid")];`
543	`tensor<int32, [2]> var_905_strides_0 = const()[name = tensor<string, []>("op_905_strides_0"), val = tensor<int32, [2]>([1, 1])];`
544	`tensor<int32, [4]> var_905_pad_0 = const()[name = tensor<string, []>("op_905_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
545	`tensor<int32, [2]> var_905_dilations_0 = const()[name = tensor<string, []>("op_905_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
546	`tensor<int32, []> var_905_groups_0 = const()[name = tensor<string, []>("op_905_groups_0"), val = tensor<int32, []>(1)];`
547	tensor<fp16, [3072, 768, 1, 1]> layers_3_fc1_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(23883648))), name = tensor<string, []>("layers_3_fc1_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [21930]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(23839680))), shape = tensor<uint32, [4]>([3072, 768, 1, 1])];
548	`tensor<fp16, [1, 3072, 1, 1500]> var_905_cast_fp16 = conv(dilations = var_905_dilations_0, groups = var_905_groups_0, pad = var_905_pad_0, pad_type = var_905_pad_type_0, strides = var_905_strides_0, weight = layers_3_fc1_outlier_module_weight_to_fp16_sparsified, x = input_27_cast_fp16)[name = tensor<string, []>("op_905_cast_fp16")];`
549	`tensor<fp16, [1, 3072, 1, 1500]> input_29_cast_fp16 = add(x = var_899_cast_fp16, y = var_905_cast_fp16)[name = tensor<string, []>("input_29_cast_fp16")];`
550	`tensor<string, []> input_31_mode_0 = const()[name = tensor<string, []>("input_31_mode_0"), val = tensor<string, []>("EXACT")];`
551	`tensor<fp16, [1, 3072, 1, 1500]> input_31_cast_fp16 = gelu(mode = input_31_mode_0, x = input_29_cast_fp16)[name = tensor<string, []>("input_31_cast_fp16")];`
552	`tensor<string, []> var_916_pad_type_0 = const()[name = tensor<string, []>("op_916_pad_type_0"), val = tensor<string, []>("valid")];`
553	`tensor<int32, [2]> var_916_strides_0 = const()[name = tensor<string, []>("op_916_strides_0"), val = tensor<int32, [2]>([1, 1])];`
554	`tensor<int32, [4]> var_916_pad_0 = const()[name = tensor<string, []>("op_916_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
555	`tensor<int32, [2]> var_916_dilations_0 = const()[name = tensor<string, []>("op_916_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
556	`tensor<int32, []> var_916_groups_0 = const()[name = tensor<string, []>("op_916_groups_0"), val = tensor<int32, []>(1)];`
557	tensor<fp16, [768, 3072, 1, 1]> layers_3_fc2_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [1179648]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(24178624))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(25358336))), name = tensor<string, []>("layers_3_fc2_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 3072, 1, 1])];
558	`tensor<fp16, [768]> layers_3_fc2_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_3_fc2_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(25358464)))];`
559	`tensor<fp16, [1, 768, 1, 1500]> var_916_cast_fp16 = conv(bias = layers_3_fc2_inlier_module_bias_to_fp16, dilations = var_916_dilations_0, groups = var_916_groups_0, pad = var_916_pad_0, pad_type = var_916_pad_type_0, strides = var_916_strides_0, weight = layers_3_fc2_inlier_module_weight_to_fp16_palettized, x = input_31_cast_fp16)[name = tensor<string, []>("op_916_cast_fp16")];`
560	`tensor<string, []> var_922_pad_type_0 = const()[name = tensor<string, []>("op_922_pad_type_0"), val = tensor<string, []>("valid")];`
561	`tensor<int32, [2]> var_922_strides_0 = const()[name = tensor<string, []>("op_922_strides_0"), val = tensor<int32, [2]>([1, 1])];`
562	`tensor<int32, [4]> var_922_pad_0 = const()[name = tensor<string, []>("op_922_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
563	`tensor<int32, [2]> var_922_dilations_0 = const()[name = tensor<string, []>("op_922_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
564	`tensor<int32, []> var_922_groups_0 = const()[name = tensor<string, []>("op_922_groups_0"), val = tensor<int32, []>(1)];`
565	tensor<fp16, [768, 3072, 1, 1]> layers_3_fc2_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(25407808))), name = tensor<string, []>("layers_3_fc2_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [23820]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(25360064))), shape = tensor<uint32, [4]>([768, 3072, 1, 1])];
566	`tensor<fp16, [1, 768, 1, 1500]> var_922_cast_fp16 = conv(dilations = var_922_dilations_0, groups = var_922_groups_0, pad = var_922_pad_0, pad_type = var_922_pad_type_0, strides = var_922_strides_0, weight = layers_3_fc2_outlier_module_weight_to_fp16_sparsified, x = input_31_cast_fp16)[name = tensor<string, []>("op_922_cast_fp16")];`
567	`tensor<fp16, [1, 768, 1, 1500]> hidden_states_11_cast_fp16 = add(x = var_916_cast_fp16, y = var_922_cast_fp16)[name = tensor<string, []>("hidden_states_11_cast_fp16")];`
568	`tensor<fp16, [1, 768, 1, 1500]> inputs_17_cast_fp16 = add(x = inputs_15_cast_fp16, y = hidden_states_11_cast_fp16)[name = tensor<string, []>("inputs_17_cast_fp16")];`
569	`tensor<int32, []> var_928 = const()[name = tensor<string, []>("op_928"), val = tensor<int32, []>(3)];`
570	`tensor<int32, [1]> out_17_axes_0 = const()[name = tensor<string, []>("out_17_axes_0"), val = tensor<int32, [1]>([1])];`
571	`tensor<fp16, []> var_950_to_fp16 = const()[name = tensor<string, []>("op_950_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
572	`tensor<fp16, [1, 768, 1, 1500]> out_17_cast_fp16 = layer_norm(axes = out_17_axes_0, epsilon = var_950_to_fp16, x = inputs_17_cast_fp16)[name = tensor<string, []>("out_17_cast_fp16")];`
573	`tensor<fp16, [768]> obj_17_gamma_0_to_fp16 = const()[name = tensor<string, []>("obj_17_gamma_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(25702784)))];`
574	`tensor<fp16, [768]> obj_17_beta_0_to_fp16 = const()[name = tensor<string, []>("obj_17_beta_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(25704384)))];`
575	`tensor<fp16, []> obj_17_epsilon_0_to_fp16 = const()[name = tensor<string, []>("obj_17_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
576	`tensor<fp16, [1, 768, 1, 1500]> obj_17_cast_fp16 = batch_norm(beta = obj_17_beta_0_to_fp16, epsilon = obj_17_epsilon_0_to_fp16, gamma = obj_17_gamma_0_to_fp16, mean = var_57_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_17_cast_fp16)[name = tensor<string, []>("obj_17_cast_fp16")];`
577	`tensor<string, []> var_972_pad_type_0 = const()[name = tensor<string, []>("op_972_pad_type_0"), val = tensor<string, []>("valid")];`
578	`tensor<int32, [2]> var_972_strides_0 = const()[name = tensor<string, []>("op_972_strides_0"), val = tensor<int32, [2]>([1, 1])];`
579	`tensor<int32, [4]> var_972_pad_0 = const()[name = tensor<string, []>("op_972_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
580	`tensor<int32, [2]> var_972_dilations_0 = const()[name = tensor<string, []>("op_972_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
581	`tensor<int32, []> var_972_groups_0 = const()[name = tensor<string, []>("op_972_groups_0"), val = tensor<int32, []>(1)];`
582	tensor<fp16, [768, 768, 1, 1]> layers_4_self_attn_q_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(25705984))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(26000960))), name = tensor<string, []>("layers_4_self_attn_q_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
583	`tensor<fp16, [768]> layers_4_self_attn_q_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_4_self_attn_q_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(26001088)))];`
584	`tensor<fp16, [1, 768, 1, 1500]> var_972_cast_fp16 = conv(bias = layers_4_self_attn_q_proj_inlier_module_bias_to_fp16, dilations = var_972_dilations_0, groups = var_972_groups_0, pad = var_972_pad_0, pad_type = var_972_pad_type_0, strides = var_972_strides_0, weight = layers_4_self_attn_q_proj_inlier_module_weight_to_fp16_palettized, x = obj_17_cast_fp16)[name = tensor<string, []>("op_972_cast_fp16")];`
585	`tensor<string, []> var_978_pad_type_0 = const()[name = tensor<string, []>("op_978_pad_type_0"), val = tensor<string, []>("valid")];`
586	`tensor<int32, [2]> var_978_strides_0 = const()[name = tensor<string, []>("op_978_strides_0"), val = tensor<int32, [2]>([1, 1])];`
587	`tensor<int32, [4]> var_978_pad_0 = const()[name = tensor<string, []>("op_978_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
588	`tensor<int32, [2]> var_978_dilations_0 = const()[name = tensor<string, []>("op_978_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
589	`tensor<int32, []> var_978_groups_0 = const()[name = tensor<string, []>("op_978_groups_0"), val = tensor<int32, []>(1)];`
590	tensor<fp16, [768, 768, 1, 1]> layers_4_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(26012480))), name = tensor<string, []>("layers_4_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [4848]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(26002688))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
591	`tensor<fp16, [1, 768, 1, 1500]> var_978_cast_fp16 = conv(dilations = var_978_dilations_0, groups = var_978_groups_0, pad = var_978_pad_0, pad_type = var_978_pad_type_0, strides = var_978_strides_0, weight = layers_4_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified, x = obj_17_cast_fp16)[name = tensor<string, []>("op_978_cast_fp16")];`
592	`tensor<fp16, [1, 768, 1, 1500]> query_9_cast_fp16 = add(x = var_972_cast_fp16, y = var_978_cast_fp16)[name = tensor<string, []>("query_9_cast_fp16")];`
593	`tensor<string, []> var_987_pad_type_0 = const()[name = tensor<string, []>("op_987_pad_type_0"), val = tensor<string, []>("valid")];`
594	`tensor<int32, [2]> var_987_strides_0 = const()[name = tensor<string, []>("op_987_strides_0"), val = tensor<int32, [2]>([1, 1])];`
595	`tensor<int32, [4]> var_987_pad_0 = const()[name = tensor<string, []>("op_987_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
596	`tensor<int32, [2]> var_987_dilations_0 = const()[name = tensor<string, []>("op_987_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
597	`tensor<int32, []> var_987_groups_0 = const()[name = tensor<string, []>("op_987_groups_0"), val = tensor<int32, []>(1)];`
598	tensor<fp16, [768, 768, 1, 1]> layers_4_self_attn_k_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(26086272))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(26381248))), name = tensor<string, []>("layers_4_self_attn_k_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
599	`tensor<fp16, [1, 768, 1, 1500]> var_987_cast_fp16 = conv(dilations = var_987_dilations_0, groups = var_987_groups_0, pad = var_987_pad_0, pad_type = var_987_pad_type_0, strides = var_987_strides_0, weight = layers_4_self_attn_k_proj_inlier_module_weight_to_fp16_palettized, x = obj_17_cast_fp16)[name = tensor<string, []>("op_987_cast_fp16")];`
600	`tensor<string, []> var_993_pad_type_0 = const()[name = tensor<string, []>("op_993_pad_type_0"), val = tensor<string, []>("valid")];`
601	`tensor<int32, [2]> var_993_strides_0 = const()[name = tensor<string, []>("op_993_strides_0"), val = tensor<int32, [2]>([1, 1])];`
602	`tensor<int32, [4]> var_993_pad_0 = const()[name = tensor<string, []>("op_993_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
603	`tensor<int32, [2]> var_993_dilations_0 = const()[name = tensor<string, []>("op_993_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
604	`tensor<int32, []> var_993_groups_0 = const()[name = tensor<string, []>("op_993_groups_0"), val = tensor<int32, []>(1)];`
605	tensor<fp16, [768, 768, 1, 1]> layers_4_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(26392192))), name = tensor<string, []>("layers_4_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [5362]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(26381376))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
606	`tensor<fp16, [1, 768, 1, 1500]> var_993_cast_fp16 = conv(dilations = var_993_dilations_0, groups = var_993_groups_0, pad = var_993_pad_0, pad_type = var_993_pad_type_0, strides = var_993_strides_0, weight = layers_4_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified, x = obj_17_cast_fp16)[name = tensor<string, []>("op_993_cast_fp16")];`
607	`tensor<fp16, [1, 768, 1, 1500]> key_9_cast_fp16 = add(x = var_987_cast_fp16, y = var_993_cast_fp16)[name = tensor<string, []>("key_9_cast_fp16")];`
608	`tensor<string, []> var_1003_pad_type_0 = const()[name = tensor<string, []>("op_1003_pad_type_0"), val = tensor<string, []>("valid")];`
609	`tensor<int32, [2]> var_1003_strides_0 = const()[name = tensor<string, []>("op_1003_strides_0"), val = tensor<int32, [2]>([1, 1])];`
610	`tensor<int32, [4]> var_1003_pad_0 = const()[name = tensor<string, []>("op_1003_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
611	`tensor<int32, [2]> var_1003_dilations_0 = const()[name = tensor<string, []>("op_1003_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
612	`tensor<int32, []> var_1003_groups_0 = const()[name = tensor<string, []>("op_1003_groups_0"), val = tensor<int32, []>(1)];`
613	tensor<fp16, [768, 768, 1, 1]> layers_4_self_attn_v_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(26465984))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(26760960))), name = tensor<string, []>("layers_4_self_attn_v_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
614	`tensor<fp16, [768]> layers_4_self_attn_v_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_4_self_attn_v_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(26761088)))];`
615	`tensor<fp16, [1, 768, 1, 1500]> var_1003_cast_fp16 = conv(bias = layers_4_self_attn_v_proj_inlier_module_bias_to_fp16, dilations = var_1003_dilations_0, groups = var_1003_groups_0, pad = var_1003_pad_0, pad_type = var_1003_pad_type_0, strides = var_1003_strides_0, weight = layers_4_self_attn_v_proj_inlier_module_weight_to_fp16_palettized, x = obj_17_cast_fp16)[name = tensor<string, []>("op_1003_cast_fp16")];`
616	`tensor<string, []> var_1009_pad_type_0 = const()[name = tensor<string, []>("op_1009_pad_type_0"), val = tensor<string, []>("valid")];`
617	`tensor<int32, [2]> var_1009_strides_0 = const()[name = tensor<string, []>("op_1009_strides_0"), val = tensor<int32, [2]>([1, 1])];`
618	`tensor<int32, [4]> var_1009_pad_0 = const()[name = tensor<string, []>("op_1009_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
619	`tensor<int32, [2]> var_1009_dilations_0 = const()[name = tensor<string, []>("op_1009_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
620	`tensor<int32, []> var_1009_groups_0 = const()[name = tensor<string, []>("op_1009_groups_0"), val = tensor<int32, []>(1)];`
621	tensor<fp16, [768, 768, 1, 1]> layers_4_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(26769984))), name = tensor<string, []>("layers_4_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [3606]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(26762688))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
622	`tensor<fp16, [1, 768, 1, 1500]> var_1009_cast_fp16 = conv(dilations = var_1009_dilations_0, groups = var_1009_groups_0, pad = var_1009_pad_0, pad_type = var_1009_pad_type_0, strides = var_1009_strides_0, weight = layers_4_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified, x = obj_17_cast_fp16)[name = tensor<string, []>("op_1009_cast_fp16")];`
623	`tensor<fp16, [1, 768, 1, 1500]> value_9_cast_fp16 = add(x = var_1003_cast_fp16, y = var_1009_cast_fp16)[name = tensor<string, []>("value_9_cast_fp16")];`
624	`tensor<int32, [4]> var_1013 = const()[name = tensor<string, []>("op_1013"), val = tensor<int32, [4]>([1, 12, 64, 1500])];`
625	`tensor<fp16, [1, 12, 64, 1500]> mh_q_9_cast_fp16 = reshape(shape = var_1013, x = query_9_cast_fp16)[name = tensor<string, []>("mh_q_9_cast_fp16")];`
626	`tensor<fp16, []> var_1015_to_fp16 = const()[name = tensor<string, []>("op_1015_to_fp16"), val = tensor<fp16, []>(0x1p-3)];`
627	`tensor<fp16, [1, 12, 64, 1500]> var_1016_cast_fp16 = mul(x = mh_q_9_cast_fp16, y = var_1015_to_fp16)[name = tensor<string, []>("op_1016_cast_fp16")];`
628	`tensor<int32, [4]> var_1019 = const()[name = tensor<string, []>("op_1019"), val = tensor<int32, [4]>([1, 12, 64, 1500])];`
629	`tensor<fp16, [1, 12, 64, 1500]> var_1020_cast_fp16 = reshape(shape = var_1019, x = key_9_cast_fp16)[name = tensor<string, []>("op_1020_cast_fp16")];`
630	`tensor<bool, []> mh_w_9_transpose_x_0 = const()[name = tensor<string, []>("mh_w_9_transpose_x_0"), val = tensor<bool, []>(true)];`
631	`tensor<bool, []> mh_w_9_transpose_y_0 = const()[name = tensor<string, []>("mh_w_9_transpose_y_0"), val = tensor<bool, []>(false)];`
632	`tensor<fp16, [1, 12, 1500, 1500]> mh_w_9_cast_fp16 = matmul(transpose_x = mh_w_9_transpose_x_0, transpose_y = mh_w_9_transpose_y_0, x = var_1016_cast_fp16, y = var_1020_cast_fp16)[name = tensor<string, []>("mh_w_9_cast_fp16")];`
633	`tensor<fp16, [1, 12, 1500, 1500]> var_1023_cast_fp16 = softmax(axis = var_928, x = mh_w_9_cast_fp16)[name = tensor<string, []>("op_1023_cast_fp16")];`
634	`tensor<int32, [4]> var_1024 = const()[name = tensor<string, []>("op_1024"), val = tensor<int32, [4]>([1, 12, 64, 1500])];`
635	`tensor<fp16, [1, 12, 64, 1500]> var_1025_cast_fp16 = reshape(shape = var_1024, x = value_9_cast_fp16)[name = tensor<string, []>("op_1025_cast_fp16")];`
636	`tensor<bool, []> attn_9_transpose_x_0 = const()[name = tensor<string, []>("attn_9_transpose_x_0"), val = tensor<bool, []>(false)];`
637	`tensor<bool, []> attn_9_transpose_y_0 = const()[name = tensor<string, []>("attn_9_transpose_y_0"), val = tensor<bool, []>(true)];`
638	`tensor<fp16, [1, 12, 64, 1500]> attn_9_cast_fp16 = matmul(transpose_x = attn_9_transpose_x_0, transpose_y = attn_9_transpose_y_0, x = var_1025_cast_fp16, y = var_1023_cast_fp16)[name = tensor<string, []>("attn_9_cast_fp16")];`
639	`tensor<int32, [4]> var_1028 = const()[name = tensor<string, []>("op_1028"), val = tensor<int32, [4]>([1, 768, 1, 1500])];`
640	`tensor<fp16, [1, 768, 1, 1500]> input_33_cast_fp16 = reshape(shape = var_1028, x = attn_9_cast_fp16)[name = tensor<string, []>("input_33_cast_fp16")];`
641	`tensor<string, []> var_1038_pad_type_0 = const()[name = tensor<string, []>("op_1038_pad_type_0"), val = tensor<string, []>("valid")];`
642	`tensor<int32, [2]> var_1038_strides_0 = const()[name = tensor<string, []>("op_1038_strides_0"), val = tensor<int32, [2]>([1, 1])];`
643	`tensor<int32, [4]> var_1038_pad_0 = const()[name = tensor<string, []>("op_1038_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
644	`tensor<int32, [2]> var_1038_dilations_0 = const()[name = tensor<string, []>("op_1038_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
645	`tensor<int32, []> var_1038_groups_0 = const()[name = tensor<string, []>("op_1038_groups_0"), val = tensor<int32, []>(1)];`
646	tensor<fp16, [768, 768, 1, 1]> layers_4_self_attn_o_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(26843776))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(27138752))), name = tensor<string, []>("layers_4_self_attn_o_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
647	`tensor<fp16, [768]> layers_4_self_attn_o_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_4_self_attn_o_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(27138880)))];`
648	`tensor<fp16, [1, 768, 1, 1500]> var_1038_cast_fp16 = conv(bias = layers_4_self_attn_o_proj_inlier_module_bias_to_fp16, dilations = var_1038_dilations_0, groups = var_1038_groups_0, pad = var_1038_pad_0, pad_type = var_1038_pad_type_0, strides = var_1038_strides_0, weight = layers_4_self_attn_o_proj_inlier_module_weight_to_fp16_palettized, x = input_33_cast_fp16)[name = tensor<string, []>("op_1038_cast_fp16")];`
649	`tensor<string, []> var_1044_pad_type_0 = const()[name = tensor<string, []>("op_1044_pad_type_0"), val = tensor<string, []>("valid")];`
650	`tensor<int32, [2]> var_1044_strides_0 = const()[name = tensor<string, []>("op_1044_strides_0"), val = tensor<int32, [2]>([1, 1])];`
651	`tensor<int32, [4]> var_1044_pad_0 = const()[name = tensor<string, []>("op_1044_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
652	`tensor<int32, [2]> var_1044_dilations_0 = const()[name = tensor<string, []>("op_1044_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
653	`tensor<int32, []> var_1044_groups_0 = const()[name = tensor<string, []>("op_1044_groups_0"), val = tensor<int32, []>(1)];`
654	tensor<fp16, [768, 768, 1, 1]> layers_4_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(27146816))), name = tensor<string, []>("layers_4_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [3133]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(27140480))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
655	`tensor<fp16, [1, 768, 1, 1500]> var_1044_cast_fp16 = conv(dilations = var_1044_dilations_0, groups = var_1044_groups_0, pad = var_1044_pad_0, pad_type = var_1044_pad_type_0, strides = var_1044_strides_0, weight = layers_4_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified, x = input_33_cast_fp16)[name = tensor<string, []>("op_1044_cast_fp16")];`
656	`tensor<fp16, [1, 768, 1, 1500]> obj_19_cast_fp16 = add(x = var_1038_cast_fp16, y = var_1044_cast_fp16)[name = tensor<string, []>("obj_19_cast_fp16")];`
657	`tensor<fp16, [1, 768, 1, 1500]> inputs_19_cast_fp16 = add(x = inputs_17_cast_fp16, y = obj_19_cast_fp16)[name = tensor<string, []>("inputs_19_cast_fp16")];`
658	`tensor<int32, [1]> out_19_axes_0 = const()[name = tensor<string, []>("out_19_axes_0"), val = tensor<int32, [1]>([1])];`
659	`tensor<fp16, []> var_1055_to_fp16 = const()[name = tensor<string, []>("op_1055_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
660	`tensor<fp16, [1, 768, 1, 1500]> out_19_cast_fp16 = layer_norm(axes = out_19_axes_0, epsilon = var_1055_to_fp16, x = inputs_19_cast_fp16)[name = tensor<string, []>("out_19_cast_fp16")];`
661	`tensor<fp16, [768]> input_35_gamma_0_to_fp16 = const()[name = tensor<string, []>("input_35_gamma_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(27220608)))];`
662	`tensor<fp16, [768]> input_35_beta_0_to_fp16 = const()[name = tensor<string, []>("input_35_beta_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(27222208)))];`
663	`tensor<fp16, []> input_35_epsilon_0_to_fp16 = const()[name = tensor<string, []>("input_35_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
664	`tensor<fp16, [1, 768, 1, 1500]> input_35_cast_fp16 = batch_norm(beta = input_35_beta_0_to_fp16, epsilon = input_35_epsilon_0_to_fp16, gamma = input_35_gamma_0_to_fp16, mean = var_57_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_19_cast_fp16)[name = tensor<string, []>("input_35_cast_fp16")];`
665	`tensor<string, []> var_1073_pad_type_0 = const()[name = tensor<string, []>("op_1073_pad_type_0"), val = tensor<string, []>("valid")];`
666	`tensor<int32, [2]> var_1073_strides_0 = const()[name = tensor<string, []>("op_1073_strides_0"), val = tensor<int32, [2]>([1, 1])];`
667	`tensor<int32, [4]> var_1073_pad_0 = const()[name = tensor<string, []>("op_1073_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
668	`tensor<int32, [2]> var_1073_dilations_0 = const()[name = tensor<string, []>("op_1073_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
669	`tensor<int32, []> var_1073_groups_0 = const()[name = tensor<string, []>("op_1073_groups_0"), val = tensor<int32, []>(1)];`
670	tensor<fp16, [3072, 768, 1, 1]> layers_4_fc1_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [1179648]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(27223808))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(28403520))), name = tensor<string, []>("layers_4_fc1_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([3072, 768, 1, 1])];
671	`tensor<fp16, [3072]> layers_4_fc1_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_4_fc1_inlier_module_bias_to_fp16"), val = tensor<fp16, [3072]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(28403648)))];`
672	`tensor<fp16, [1, 3072, 1, 1500]> var_1073_cast_fp16 = conv(bias = layers_4_fc1_inlier_module_bias_to_fp16, dilations = var_1073_dilations_0, groups = var_1073_groups_0, pad = var_1073_pad_0, pad_type = var_1073_pad_type_0, strides = var_1073_strides_0, weight = layers_4_fc1_inlier_module_weight_to_fp16_palettized, x = input_35_cast_fp16)[name = tensor<string, []>("op_1073_cast_fp16")];`
673	`tensor<string, []> var_1079_pad_type_0 = const()[name = tensor<string, []>("op_1079_pad_type_0"), val = tensor<string, []>("valid")];`
674	`tensor<int32, [2]> var_1079_strides_0 = const()[name = tensor<string, []>("op_1079_strides_0"), val = tensor<int32, [2]>([1, 1])];`
675	`tensor<int32, [4]> var_1079_pad_0 = const()[name = tensor<string, []>("op_1079_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
676	`tensor<int32, [2]> var_1079_dilations_0 = const()[name = tensor<string, []>("op_1079_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
677	`tensor<int32, []> var_1079_groups_0 = const()[name = tensor<string, []>("op_1079_groups_0"), val = tensor<int32, []>(1)];`
678	tensor<fp16, [3072, 768, 1, 1]> layers_4_fc1_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(28452288))), name = tensor<string, []>("layers_4_fc1_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [21163]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(28409856))), shape = tensor<uint32, [4]>([3072, 768, 1, 1])];
679	`tensor<fp16, [1, 3072, 1, 1500]> var_1079_cast_fp16 = conv(dilations = var_1079_dilations_0, groups = var_1079_groups_0, pad = var_1079_pad_0, pad_type = var_1079_pad_type_0, strides = var_1079_strides_0, weight = layers_4_fc1_outlier_module_weight_to_fp16_sparsified, x = input_35_cast_fp16)[name = tensor<string, []>("op_1079_cast_fp16")];`
680	`tensor<fp16, [1, 3072, 1, 1500]> input_37_cast_fp16 = add(x = var_1073_cast_fp16, y = var_1079_cast_fp16)[name = tensor<string, []>("input_37_cast_fp16")];`
681	`tensor<string, []> input_39_mode_0 = const()[name = tensor<string, []>("input_39_mode_0"), val = tensor<string, []>("EXACT")];`
682	`tensor<fp16, [1, 3072, 1, 1500]> input_39_cast_fp16 = gelu(mode = input_39_mode_0, x = input_37_cast_fp16)[name = tensor<string, []>("input_39_cast_fp16")];`
683	`tensor<string, []> var_1090_pad_type_0 = const()[name = tensor<string, []>("op_1090_pad_type_0"), val = tensor<string, []>("valid")];`
684	`tensor<int32, [2]> var_1090_strides_0 = const()[name = tensor<string, []>("op_1090_strides_0"), val = tensor<int32, [2]>([1, 1])];`
685	`tensor<int32, [4]> var_1090_pad_0 = const()[name = tensor<string, []>("op_1090_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
686	`tensor<int32, [2]> var_1090_dilations_0 = const()[name = tensor<string, []>("op_1090_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
687	`tensor<int32, []> var_1090_groups_0 = const()[name = tensor<string, []>("op_1090_groups_0"), val = tensor<int32, []>(1)];`
688	tensor<fp16, [768, 3072, 1, 1]> layers_4_fc2_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [1179648]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(28747264))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(29926976))), name = tensor<string, []>("layers_4_fc2_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 3072, 1, 1])];
689	`tensor<fp16, [768]> layers_4_fc2_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_4_fc2_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(29927104)))];`
690	`tensor<fp16, [1, 768, 1, 1500]> var_1090_cast_fp16 = conv(bias = layers_4_fc2_inlier_module_bias_to_fp16, dilations = var_1090_dilations_0, groups = var_1090_groups_0, pad = var_1090_pad_0, pad_type = var_1090_pad_type_0, strides = var_1090_strides_0, weight = layers_4_fc2_inlier_module_weight_to_fp16_palettized, x = input_39_cast_fp16)[name = tensor<string, []>("op_1090_cast_fp16")];`
691	`tensor<string, []> var_1096_pad_type_0 = const()[name = tensor<string, []>("op_1096_pad_type_0"), val = tensor<string, []>("valid")];`
692	`tensor<int32, [2]> var_1096_strides_0 = const()[name = tensor<string, []>("op_1096_strides_0"), val = tensor<int32, [2]>([1, 1])];`
693	`tensor<int32, [4]> var_1096_pad_0 = const()[name = tensor<string, []>("op_1096_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
694	`tensor<int32, [2]> var_1096_dilations_0 = const()[name = tensor<string, []>("op_1096_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
695	`tensor<int32, []> var_1096_groups_0 = const()[name = tensor<string, []>("op_1096_groups_0"), val = tensor<int32, []>(1)];`
696	tensor<fp16, [768, 3072, 1, 1]> layers_4_fc2_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(29977152))), name = tensor<string, []>("layers_4_fc2_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [24181]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(29928704))), shape = tensor<uint32, [4]>([768, 3072, 1, 1])];
697	`tensor<fp16, [1, 768, 1, 1500]> var_1096_cast_fp16 = conv(dilations = var_1096_dilations_0, groups = var_1096_groups_0, pad = var_1096_pad_0, pad_type = var_1096_pad_type_0, strides = var_1096_strides_0, weight = layers_4_fc2_outlier_module_weight_to_fp16_sparsified, x = input_39_cast_fp16)[name = tensor<string, []>("op_1096_cast_fp16")];`
698	`tensor<fp16, [1, 768, 1, 1500]> hidden_states_13_cast_fp16 = add(x = var_1090_cast_fp16, y = var_1096_cast_fp16)[name = tensor<string, []>("hidden_states_13_cast_fp16")];`
699	`tensor<fp16, [1, 768, 1, 1500]> inputs_21_cast_fp16 = add(x = inputs_19_cast_fp16, y = hidden_states_13_cast_fp16)[name = tensor<string, []>("inputs_21_cast_fp16")];`
700	`tensor<int32, []> var_1102 = const()[name = tensor<string, []>("op_1102"), val = tensor<int32, []>(3)];`
701	`tensor<int32, [1]> out_21_axes_0 = const()[name = tensor<string, []>("out_21_axes_0"), val = tensor<int32, [1]>([1])];`
702	`tensor<fp16, []> var_1124_to_fp16 = const()[name = tensor<string, []>("op_1124_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
703	`tensor<fp16, [1, 768, 1, 1500]> out_21_cast_fp16 = layer_norm(axes = out_21_axes_0, epsilon = var_1124_to_fp16, x = inputs_21_cast_fp16)[name = tensor<string, []>("out_21_cast_fp16")];`
704	`tensor<fp16, [768]> obj_21_gamma_0_to_fp16 = const()[name = tensor<string, []>("obj_21_gamma_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(30272128)))];`
705	`tensor<fp16, [768]> obj_21_beta_0_to_fp16 = const()[name = tensor<string, []>("obj_21_beta_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(30273728)))];`
706	`tensor<fp16, []> obj_21_epsilon_0_to_fp16 = const()[name = tensor<string, []>("obj_21_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
707	`tensor<fp16, [1, 768, 1, 1500]> obj_21_cast_fp16 = batch_norm(beta = obj_21_beta_0_to_fp16, epsilon = obj_21_epsilon_0_to_fp16, gamma = obj_21_gamma_0_to_fp16, mean = var_57_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_21_cast_fp16)[name = tensor<string, []>("obj_21_cast_fp16")];`
708	`tensor<string, []> var_1146_pad_type_0 = const()[name = tensor<string, []>("op_1146_pad_type_0"), val = tensor<string, []>("valid")];`
709	`tensor<int32, [2]> var_1146_strides_0 = const()[name = tensor<string, []>("op_1146_strides_0"), val = tensor<int32, [2]>([1, 1])];`
710	`tensor<int32, [4]> var_1146_pad_0 = const()[name = tensor<string, []>("op_1146_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
711	`tensor<int32, [2]> var_1146_dilations_0 = const()[name = tensor<string, []>("op_1146_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
712	`tensor<int32, []> var_1146_groups_0 = const()[name = tensor<string, []>("op_1146_groups_0"), val = tensor<int32, []>(1)];`
713	tensor<fp16, [768, 768, 1, 1]> layers_5_self_attn_q_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(30275328))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(30570304))), name = tensor<string, []>("layers_5_self_attn_q_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
714	`tensor<fp16, [768]> layers_5_self_attn_q_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_5_self_attn_q_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(30570432)))];`
715	`tensor<fp16, [1, 768, 1, 1500]> var_1146_cast_fp16 = conv(bias = layers_5_self_attn_q_proj_inlier_module_bias_to_fp16, dilations = var_1146_dilations_0, groups = var_1146_groups_0, pad = var_1146_pad_0, pad_type = var_1146_pad_type_0, strides = var_1146_strides_0, weight = layers_5_self_attn_q_proj_inlier_module_weight_to_fp16_palettized, x = obj_21_cast_fp16)[name = tensor<string, []>("op_1146_cast_fp16")];`
716	`tensor<string, []> var_1152_pad_type_0 = const()[name = tensor<string, []>("op_1152_pad_type_0"), val = tensor<string, []>("valid")];`
717	`tensor<int32, [2]> var_1152_strides_0 = const()[name = tensor<string, []>("op_1152_strides_0"), val = tensor<int32, [2]>([1, 1])];`
718	`tensor<int32, [4]> var_1152_pad_0 = const()[name = tensor<string, []>("op_1152_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
719	`tensor<int32, [2]> var_1152_dilations_0 = const()[name = tensor<string, []>("op_1152_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
720	`tensor<int32, []> var_1152_groups_0 = const()[name = tensor<string, []>("op_1152_groups_0"), val = tensor<int32, []>(1)];`
721	tensor<fp16, [768, 768, 1, 1]> layers_5_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(30579968))), name = tensor<string, []>("layers_5_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [3910]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(30572032))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
722	`tensor<fp16, [1, 768, 1, 1500]> var_1152_cast_fp16 = conv(dilations = var_1152_dilations_0, groups = var_1152_groups_0, pad = var_1152_pad_0, pad_type = var_1152_pad_type_0, strides = var_1152_strides_0, weight = layers_5_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified, x = obj_21_cast_fp16)[name = tensor<string, []>("op_1152_cast_fp16")];`
723	`tensor<fp16, [1, 768, 1, 1500]> query_11_cast_fp16 = add(x = var_1146_cast_fp16, y = var_1152_cast_fp16)[name = tensor<string, []>("query_11_cast_fp16")];`
724	`tensor<string, []> var_1161_pad_type_0 = const()[name = tensor<string, []>("op_1161_pad_type_0"), val = tensor<string, []>("valid")];`
725	`tensor<int32, [2]> var_1161_strides_0 = const()[name = tensor<string, []>("op_1161_strides_0"), val = tensor<int32, [2]>([1, 1])];`
726	`tensor<int32, [4]> var_1161_pad_0 = const()[name = tensor<string, []>("op_1161_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
727	`tensor<int32, [2]> var_1161_dilations_0 = const()[name = tensor<string, []>("op_1161_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
728	`tensor<int32, []> var_1161_groups_0 = const()[name = tensor<string, []>("op_1161_groups_0"), val = tensor<int32, []>(1)];`
729	tensor<fp16, [768, 768, 1, 1]> layers_5_self_attn_k_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(30653760))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(30948736))), name = tensor<string, []>("layers_5_self_attn_k_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
730	`tensor<fp16, [1, 768, 1, 1500]> var_1161_cast_fp16 = conv(dilations = var_1161_dilations_0, groups = var_1161_groups_0, pad = var_1161_pad_0, pad_type = var_1161_pad_type_0, strides = var_1161_strides_0, weight = layers_5_self_attn_k_proj_inlier_module_weight_to_fp16_palettized, x = obj_21_cast_fp16)[name = tensor<string, []>("op_1161_cast_fp16")];`
731	`tensor<string, []> var_1167_pad_type_0 = const()[name = tensor<string, []>("op_1167_pad_type_0"), val = tensor<string, []>("valid")];`
732	`tensor<int32, [2]> var_1167_strides_0 = const()[name = tensor<string, []>("op_1167_strides_0"), val = tensor<int32, [2]>([1, 1])];`
733	`tensor<int32, [4]> var_1167_pad_0 = const()[name = tensor<string, []>("op_1167_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
734	`tensor<int32, [2]> var_1167_dilations_0 = const()[name = tensor<string, []>("op_1167_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
735	`tensor<int32, []> var_1167_groups_0 = const()[name = tensor<string, []>("op_1167_groups_0"), val = tensor<int32, []>(1)];`
736	tensor<fp16, [768, 768, 1, 1]> layers_5_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(30957056))), name = tensor<string, []>("layers_5_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [4049]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(30948864))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
737	`tensor<fp16, [1, 768, 1, 1500]> var_1167_cast_fp16 = conv(dilations = var_1167_dilations_0, groups = var_1167_groups_0, pad = var_1167_pad_0, pad_type = var_1167_pad_type_0, strides = var_1167_strides_0, weight = layers_5_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified, x = obj_21_cast_fp16)[name = tensor<string, []>("op_1167_cast_fp16")];`
738	`tensor<fp16, [1, 768, 1, 1500]> key_11_cast_fp16 = add(x = var_1161_cast_fp16, y = var_1167_cast_fp16)[name = tensor<string, []>("key_11_cast_fp16")];`
739	`tensor<string, []> var_1177_pad_type_0 = const()[name = tensor<string, []>("op_1177_pad_type_0"), val = tensor<string, []>("valid")];`
740	`tensor<int32, [2]> var_1177_strides_0 = const()[name = tensor<string, []>("op_1177_strides_0"), val = tensor<int32, [2]>([1, 1])];`
741	`tensor<int32, [4]> var_1177_pad_0 = const()[name = tensor<string, []>("op_1177_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
742	`tensor<int32, [2]> var_1177_dilations_0 = const()[name = tensor<string, []>("op_1177_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
743	`tensor<int32, []> var_1177_groups_0 = const()[name = tensor<string, []>("op_1177_groups_0"), val = tensor<int32, []>(1)];`
744	tensor<fp16, [768, 768, 1, 1]> layers_5_self_attn_v_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(31030848))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(31325824))), name = tensor<string, []>("layers_5_self_attn_v_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
745	`tensor<fp16, [768]> layers_5_self_attn_v_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_5_self_attn_v_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(31325952)))];`
746	`tensor<fp16, [1, 768, 1, 1500]> var_1177_cast_fp16 = conv(bias = layers_5_self_attn_v_proj_inlier_module_bias_to_fp16, dilations = var_1177_dilations_0, groups = var_1177_groups_0, pad = var_1177_pad_0, pad_type = var_1177_pad_type_0, strides = var_1177_strides_0, weight = layers_5_self_attn_v_proj_inlier_module_weight_to_fp16_palettized, x = obj_21_cast_fp16)[name = tensor<string, []>("op_1177_cast_fp16")];`
747	`tensor<string, []> var_1183_pad_type_0 = const()[name = tensor<string, []>("op_1183_pad_type_0"), val = tensor<string, []>("valid")];`
748	`tensor<int32, [2]> var_1183_strides_0 = const()[name = tensor<string, []>("op_1183_strides_0"), val = tensor<int32, [2]>([1, 1])];`
749	`tensor<int32, [4]> var_1183_pad_0 = const()[name = tensor<string, []>("op_1183_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
750	`tensor<int32, [2]> var_1183_dilations_0 = const()[name = tensor<string, []>("op_1183_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
751	`tensor<int32, []> var_1183_groups_0 = const()[name = tensor<string, []>("op_1183_groups_0"), val = tensor<int32, []>(1)];`
752	tensor<fp16, [768, 768, 1, 1]> layers_5_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(31334976))), name = tensor<string, []>("layers_5_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [3661]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(31327552))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
753	`tensor<fp16, [1, 768, 1, 1500]> var_1183_cast_fp16 = conv(dilations = var_1183_dilations_0, groups = var_1183_groups_0, pad = var_1183_pad_0, pad_type = var_1183_pad_type_0, strides = var_1183_strides_0, weight = layers_5_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified, x = obj_21_cast_fp16)[name = tensor<string, []>("op_1183_cast_fp16")];`
754	`tensor<fp16, [1, 768, 1, 1500]> value_11_cast_fp16 = add(x = var_1177_cast_fp16, y = var_1183_cast_fp16)[name = tensor<string, []>("value_11_cast_fp16")];`
755	`tensor<int32, [4]> var_1187 = const()[name = tensor<string, []>("op_1187"), val = tensor<int32, [4]>([1, 12, 64, 1500])];`
756	`tensor<fp16, [1, 12, 64, 1500]> mh_q_11_cast_fp16 = reshape(shape = var_1187, x = query_11_cast_fp16)[name = tensor<string, []>("mh_q_11_cast_fp16")];`
757	`tensor<fp16, []> var_1189_to_fp16 = const()[name = tensor<string, []>("op_1189_to_fp16"), val = tensor<fp16, []>(0x1p-3)];`
758	`tensor<fp16, [1, 12, 64, 1500]> var_1190_cast_fp16 = mul(x = mh_q_11_cast_fp16, y = var_1189_to_fp16)[name = tensor<string, []>("op_1190_cast_fp16")];`
759	`tensor<int32, [4]> var_1193 = const()[name = tensor<string, []>("op_1193"), val = tensor<int32, [4]>([1, 12, 64, 1500])];`
760	`tensor<fp16, [1, 12, 64, 1500]> var_1194_cast_fp16 = reshape(shape = var_1193, x = key_11_cast_fp16)[name = tensor<string, []>("op_1194_cast_fp16")];`
761	`tensor<bool, []> mh_w_11_transpose_x_0 = const()[name = tensor<string, []>("mh_w_11_transpose_x_0"), val = tensor<bool, []>(true)];`
762	`tensor<bool, []> mh_w_11_transpose_y_0 = const()[name = tensor<string, []>("mh_w_11_transpose_y_0"), val = tensor<bool, []>(false)];`
763	`tensor<fp16, [1, 12, 1500, 1500]> mh_w_11_cast_fp16 = matmul(transpose_x = mh_w_11_transpose_x_0, transpose_y = mh_w_11_transpose_y_0, x = var_1190_cast_fp16, y = var_1194_cast_fp16)[name = tensor<string, []>("mh_w_11_cast_fp16")];`
764	`tensor<fp16, [1, 12, 1500, 1500]> var_1197_cast_fp16 = softmax(axis = var_1102, x = mh_w_11_cast_fp16)[name = tensor<string, []>("op_1197_cast_fp16")];`
765	`tensor<int32, [4]> var_1198 = const()[name = tensor<string, []>("op_1198"), val = tensor<int32, [4]>([1, 12, 64, 1500])];`
766	`tensor<fp16, [1, 12, 64, 1500]> var_1199_cast_fp16 = reshape(shape = var_1198, x = value_11_cast_fp16)[name = tensor<string, []>("op_1199_cast_fp16")];`
767	`tensor<bool, []> attn_11_transpose_x_0 = const()[name = tensor<string, []>("attn_11_transpose_x_0"), val = tensor<bool, []>(false)];`
768	`tensor<bool, []> attn_11_transpose_y_0 = const()[name = tensor<string, []>("attn_11_transpose_y_0"), val = tensor<bool, []>(true)];`
769	`tensor<fp16, [1, 12, 64, 1500]> attn_11_cast_fp16 = matmul(transpose_x = attn_11_transpose_x_0, transpose_y = attn_11_transpose_y_0, x = var_1199_cast_fp16, y = var_1197_cast_fp16)[name = tensor<string, []>("attn_11_cast_fp16")];`
770	`tensor<int32, [4]> var_1202 = const()[name = tensor<string, []>("op_1202"), val = tensor<int32, [4]>([1, 768, 1, 1500])];`
771	`tensor<fp16, [1, 768, 1, 1500]> input_41_cast_fp16 = reshape(shape = var_1202, x = attn_11_cast_fp16)[name = tensor<string, []>("input_41_cast_fp16")];`
772	`tensor<string, []> var_1212_pad_type_0 = const()[name = tensor<string, []>("op_1212_pad_type_0"), val = tensor<string, []>("valid")];`
773	`tensor<int32, [2]> var_1212_strides_0 = const()[name = tensor<string, []>("op_1212_strides_0"), val = tensor<int32, [2]>([1, 1])];`
774	`tensor<int32, [4]> var_1212_pad_0 = const()[name = tensor<string, []>("op_1212_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
775	`tensor<int32, [2]> var_1212_dilations_0 = const()[name = tensor<string, []>("op_1212_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
776	`tensor<int32, []> var_1212_groups_0 = const()[name = tensor<string, []>("op_1212_groups_0"), val = tensor<int32, []>(1)];`
777	tensor<fp16, [768, 768, 1, 1]> layers_5_self_attn_o_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(31408768))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(31703744))), name = tensor<string, []>("layers_5_self_attn_o_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
778	`tensor<fp16, [768]> layers_5_self_attn_o_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_5_self_attn_o_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(31703872)))];`
779	`tensor<fp16, [1, 768, 1, 1500]> var_1212_cast_fp16 = conv(bias = layers_5_self_attn_o_proj_inlier_module_bias_to_fp16, dilations = var_1212_dilations_0, groups = var_1212_groups_0, pad = var_1212_pad_0, pad_type = var_1212_pad_type_0, strides = var_1212_strides_0, weight = layers_5_self_attn_o_proj_inlier_module_weight_to_fp16_palettized, x = input_41_cast_fp16)[name = tensor<string, []>("op_1212_cast_fp16")];`
780	`tensor<string, []> var_1218_pad_type_0 = const()[name = tensor<string, []>("op_1218_pad_type_0"), val = tensor<string, []>("valid")];`
781	`tensor<int32, [2]> var_1218_strides_0 = const()[name = tensor<string, []>("op_1218_strides_0"), val = tensor<int32, [2]>([1, 1])];`
782	`tensor<int32, [4]> var_1218_pad_0 = const()[name = tensor<string, []>("op_1218_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
783	`tensor<int32, [2]> var_1218_dilations_0 = const()[name = tensor<string, []>("op_1218_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
784	`tensor<int32, []> var_1218_groups_0 = const()[name = tensor<string, []>("op_1218_groups_0"), val = tensor<int32, []>(1)];`
785	tensor<fp16, [768, 768, 1, 1]> layers_5_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(31713792))), name = tensor<string, []>("layers_5_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [4128]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(31705472))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
786	`tensor<fp16, [1, 768, 1, 1500]> var_1218_cast_fp16 = conv(dilations = var_1218_dilations_0, groups = var_1218_groups_0, pad = var_1218_pad_0, pad_type = var_1218_pad_type_0, strides = var_1218_strides_0, weight = layers_5_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified, x = input_41_cast_fp16)[name = tensor<string, []>("op_1218_cast_fp16")];`
787	`tensor<fp16, [1, 768, 1, 1500]> obj_23_cast_fp16 = add(x = var_1212_cast_fp16, y = var_1218_cast_fp16)[name = tensor<string, []>("obj_23_cast_fp16")];`
788	`tensor<fp16, [1, 768, 1, 1500]> inputs_23_cast_fp16 = add(x = inputs_21_cast_fp16, y = obj_23_cast_fp16)[name = tensor<string, []>("inputs_23_cast_fp16")];`
789	`tensor<int32, [1]> out_23_axes_0 = const()[name = tensor<string, []>("out_23_axes_0"), val = tensor<int32, [1]>([1])];`
790	`tensor<fp16, []> var_1229_to_fp16 = const()[name = tensor<string, []>("op_1229_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
791	`tensor<fp16, [1, 768, 1, 1500]> out_23_cast_fp16 = layer_norm(axes = out_23_axes_0, epsilon = var_1229_to_fp16, x = inputs_23_cast_fp16)[name = tensor<string, []>("out_23_cast_fp16")];`
792	`tensor<fp16, [768]> input_43_gamma_0_to_fp16 = const()[name = tensor<string, []>("input_43_gamma_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(31787584)))];`
793	`tensor<fp16, [768]> input_43_beta_0_to_fp16 = const()[name = tensor<string, []>("input_43_beta_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(31789184)))];`
794	`tensor<fp16, []> input_43_epsilon_0_to_fp16 = const()[name = tensor<string, []>("input_43_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
795	`tensor<fp16, [1, 768, 1, 1500]> input_43_cast_fp16 = batch_norm(beta = input_43_beta_0_to_fp16, epsilon = input_43_epsilon_0_to_fp16, gamma = input_43_gamma_0_to_fp16, mean = var_57_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_23_cast_fp16)[name = tensor<string, []>("input_43_cast_fp16")];`
796	`tensor<string, []> var_1247_pad_type_0 = const()[name = tensor<string, []>("op_1247_pad_type_0"), val = tensor<string, []>("valid")];`
797	`tensor<int32, [2]> var_1247_strides_0 = const()[name = tensor<string, []>("op_1247_strides_0"), val = tensor<int32, [2]>([1, 1])];`
798	`tensor<int32, [4]> var_1247_pad_0 = const()[name = tensor<string, []>("op_1247_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
799	`tensor<int32, [2]> var_1247_dilations_0 = const()[name = tensor<string, []>("op_1247_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
800	`tensor<int32, []> var_1247_groups_0 = const()[name = tensor<string, []>("op_1247_groups_0"), val = tensor<int32, []>(1)];`
801	tensor<fp16, [3072, 768, 1, 1]> layers_5_fc1_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [1179648]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(31790784))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(32970496))), name = tensor<string, []>("layers_5_fc1_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([3072, 768, 1, 1])];
802	`tensor<fp16, [3072]> layers_5_fc1_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_5_fc1_inlier_module_bias_to_fp16"), val = tensor<fp16, [3072]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(32970624)))];`
803	`tensor<fp16, [1, 3072, 1, 1500]> var_1247_cast_fp16 = conv(bias = layers_5_fc1_inlier_module_bias_to_fp16, dilations = var_1247_dilations_0, groups = var_1247_groups_0, pad = var_1247_pad_0, pad_type = var_1247_pad_type_0, strides = var_1247_strides_0, weight = layers_5_fc1_inlier_module_weight_to_fp16_palettized, x = input_43_cast_fp16)[name = tensor<string, []>("op_1247_cast_fp16")];`
804	`tensor<string, []> var_1253_pad_type_0 = const()[name = tensor<string, []>("op_1253_pad_type_0"), val = tensor<string, []>("valid")];`
805	`tensor<int32, [2]> var_1253_strides_0 = const()[name = tensor<string, []>("op_1253_strides_0"), val = tensor<int32, [2]>([1, 1])];`
806	`tensor<int32, [4]> var_1253_pad_0 = const()[name = tensor<string, []>("op_1253_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
807	`tensor<int32, [2]> var_1253_dilations_0 = const()[name = tensor<string, []>("op_1253_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
808	`tensor<int32, []> var_1253_groups_0 = const()[name = tensor<string, []>("op_1253_groups_0"), val = tensor<int32, []>(1)];`
809	tensor<fp16, [3072, 768, 1, 1]> layers_5_fc1_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(33018432))), name = tensor<string, []>("layers_5_fc1_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [20754]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(32976832))), shape = tensor<uint32, [4]>([3072, 768, 1, 1])];
810	`tensor<fp16, [1, 3072, 1, 1500]> var_1253_cast_fp16 = conv(dilations = var_1253_dilations_0, groups = var_1253_groups_0, pad = var_1253_pad_0, pad_type = var_1253_pad_type_0, strides = var_1253_strides_0, weight = layers_5_fc1_outlier_module_weight_to_fp16_sparsified, x = input_43_cast_fp16)[name = tensor<string, []>("op_1253_cast_fp16")];`
811	`tensor<fp16, [1, 3072, 1, 1500]> input_45_cast_fp16 = add(x = var_1247_cast_fp16, y = var_1253_cast_fp16)[name = tensor<string, []>("input_45_cast_fp16")];`
812	`tensor<string, []> input_47_mode_0 = const()[name = tensor<string, []>("input_47_mode_0"), val = tensor<string, []>("EXACT")];`
813	`tensor<fp16, [1, 3072, 1, 1500]> input_47_cast_fp16 = gelu(mode = input_47_mode_0, x = input_45_cast_fp16)[name = tensor<string, []>("input_47_cast_fp16")];`
814	`tensor<string, []> var_1264_pad_type_0 = const()[name = tensor<string, []>("op_1264_pad_type_0"), val = tensor<string, []>("valid")];`
815	`tensor<int32, [2]> var_1264_strides_0 = const()[name = tensor<string, []>("op_1264_strides_0"), val = tensor<int32, [2]>([1, 1])];`
816	`tensor<int32, [4]> var_1264_pad_0 = const()[name = tensor<string, []>("op_1264_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
817	`tensor<int32, [2]> var_1264_dilations_0 = const()[name = tensor<string, []>("op_1264_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
818	`tensor<int32, []> var_1264_groups_0 = const()[name = tensor<string, []>("op_1264_groups_0"), val = tensor<int32, []>(1)];`
819	tensor<fp16, [768, 3072, 1, 1]> layers_5_fc2_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [1179648]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(33313408))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(34493120))), name = tensor<string, []>("layers_5_fc2_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 3072, 1, 1])];
820	`tensor<fp16, [768]> layers_5_fc2_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_5_fc2_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(34493248)))];`
821	`tensor<fp16, [1, 768, 1, 1500]> var_1264_cast_fp16 = conv(bias = layers_5_fc2_inlier_module_bias_to_fp16, dilations = var_1264_dilations_0, groups = var_1264_groups_0, pad = var_1264_pad_0, pad_type = var_1264_pad_type_0, strides = var_1264_strides_0, weight = layers_5_fc2_inlier_module_weight_to_fp16_palettized, x = input_47_cast_fp16)[name = tensor<string, []>("op_1264_cast_fp16")];`
822	`tensor<string, []> var_1270_pad_type_0 = const()[name = tensor<string, []>("op_1270_pad_type_0"), val = tensor<string, []>("valid")];`
823	`tensor<int32, [2]> var_1270_strides_0 = const()[name = tensor<string, []>("op_1270_strides_0"), val = tensor<int32, [2]>([1, 1])];`
824	`tensor<int32, [4]> var_1270_pad_0 = const()[name = tensor<string, []>("op_1270_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
825	`tensor<int32, [2]> var_1270_dilations_0 = const()[name = tensor<string, []>("op_1270_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
826	`tensor<int32, []> var_1270_groups_0 = const()[name = tensor<string, []>("op_1270_groups_0"), val = tensor<int32, []>(1)];`
827	tensor<fp16, [768, 3072, 1, 1]> layers_5_fc2_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(34539520))), name = tensor<string, []>("layers_5_fc2_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [22280]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(34494848))), shape = tensor<uint32, [4]>([768, 3072, 1, 1])];
828	`tensor<fp16, [1, 768, 1, 1500]> var_1270_cast_fp16 = conv(dilations = var_1270_dilations_0, groups = var_1270_groups_0, pad = var_1270_pad_0, pad_type = var_1270_pad_type_0, strides = var_1270_strides_0, weight = layers_5_fc2_outlier_module_weight_to_fp16_sparsified, x = input_47_cast_fp16)[name = tensor<string, []>("op_1270_cast_fp16")];`
829	`tensor<fp16, [1, 768, 1, 1500]> hidden_states_15_cast_fp16 = add(x = var_1264_cast_fp16, y = var_1270_cast_fp16)[name = tensor<string, []>("hidden_states_15_cast_fp16")];`
830	`tensor<fp16, [1, 768, 1, 1500]> inputs_25_cast_fp16 = add(x = inputs_23_cast_fp16, y = hidden_states_15_cast_fp16)[name = tensor<string, []>("inputs_25_cast_fp16")];`
831	`tensor<int32, []> var_1276 = const()[name = tensor<string, []>("op_1276"), val = tensor<int32, []>(3)];`
832	`tensor<int32, [1]> out_25_axes_0 = const()[name = tensor<string, []>("out_25_axes_0"), val = tensor<int32, [1]>([1])];`
833	`tensor<fp16, []> var_1298_to_fp16 = const()[name = tensor<string, []>("op_1298_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
834	`tensor<fp16, [1, 768, 1, 1500]> out_25_cast_fp16 = layer_norm(axes = out_25_axes_0, epsilon = var_1298_to_fp16, x = inputs_25_cast_fp16)[name = tensor<string, []>("out_25_cast_fp16")];`
835	`tensor<fp16, [768]> obj_25_gamma_0_to_fp16 = const()[name = tensor<string, []>("obj_25_gamma_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(34834496)))];`
836	`tensor<fp16, [768]> obj_25_beta_0_to_fp16 = const()[name = tensor<string, []>("obj_25_beta_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(34836096)))];`
837	`tensor<fp16, []> obj_25_epsilon_0_to_fp16 = const()[name = tensor<string, []>("obj_25_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
838	`tensor<fp16, [1, 768, 1, 1500]> obj_25_cast_fp16 = batch_norm(beta = obj_25_beta_0_to_fp16, epsilon = obj_25_epsilon_0_to_fp16, gamma = obj_25_gamma_0_to_fp16, mean = var_57_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_25_cast_fp16)[name = tensor<string, []>("obj_25_cast_fp16")];`
839	`tensor<string, []> var_1320_pad_type_0 = const()[name = tensor<string, []>("op_1320_pad_type_0"), val = tensor<string, []>("valid")];`
840	`tensor<int32, [2]> var_1320_strides_0 = const()[name = tensor<string, []>("op_1320_strides_0"), val = tensor<int32, [2]>([1, 1])];`
841	`tensor<int32, [4]> var_1320_pad_0 = const()[name = tensor<string, []>("op_1320_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
842	`tensor<int32, [2]> var_1320_dilations_0 = const()[name = tensor<string, []>("op_1320_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
843	`tensor<int32, []> var_1320_groups_0 = const()[name = tensor<string, []>("op_1320_groups_0"), val = tensor<int32, []>(1)];`
844	tensor<fp16, [768, 768, 1, 1]> layers_6_self_attn_q_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(34837696))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(35132672))), name = tensor<string, []>("layers_6_self_attn_q_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
845	`tensor<fp16, [768]> layers_6_self_attn_q_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_6_self_attn_q_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(35132800)))];`
846	`tensor<fp16, [1, 768, 1, 1500]> var_1320_cast_fp16 = conv(bias = layers_6_self_attn_q_proj_inlier_module_bias_to_fp16, dilations = var_1320_dilations_0, groups = var_1320_groups_0, pad = var_1320_pad_0, pad_type = var_1320_pad_type_0, strides = var_1320_strides_0, weight = layers_6_self_attn_q_proj_inlier_module_weight_to_fp16_palettized, x = obj_25_cast_fp16)[name = tensor<string, []>("op_1320_cast_fp16")];`
847	`tensor<string, []> var_1326_pad_type_0 = const()[name = tensor<string, []>("op_1326_pad_type_0"), val = tensor<string, []>("valid")];`
848	`tensor<int32, [2]> var_1326_strides_0 = const()[name = tensor<string, []>("op_1326_strides_0"), val = tensor<int32, [2]>([1, 1])];`
849	`tensor<int32, [4]> var_1326_pad_0 = const()[name = tensor<string, []>("op_1326_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
850	`tensor<int32, [2]> var_1326_dilations_0 = const()[name = tensor<string, []>("op_1326_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
851	`tensor<int32, []> var_1326_groups_0 = const()[name = tensor<string, []>("op_1326_groups_0"), val = tensor<int32, []>(1)];`
852	tensor<fp16, [768, 768, 1, 1]> layers_6_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(35142208))), name = tensor<string, []>("layers_6_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [3870]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(35134400))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
853	`tensor<fp16, [1, 768, 1, 1500]> var_1326_cast_fp16 = conv(dilations = var_1326_dilations_0, groups = var_1326_groups_0, pad = var_1326_pad_0, pad_type = var_1326_pad_type_0, strides = var_1326_strides_0, weight = layers_6_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified, x = obj_25_cast_fp16)[name = tensor<string, []>("op_1326_cast_fp16")];`
854	`tensor<fp16, [1, 768, 1, 1500]> query_13_cast_fp16 = add(x = var_1320_cast_fp16, y = var_1326_cast_fp16)[name = tensor<string, []>("query_13_cast_fp16")];`
855	`tensor<string, []> var_1335_pad_type_0 = const()[name = tensor<string, []>("op_1335_pad_type_0"), val = tensor<string, []>("valid")];`
856	`tensor<int32, [2]> var_1335_strides_0 = const()[name = tensor<string, []>("op_1335_strides_0"), val = tensor<int32, [2]>([1, 1])];`
857	`tensor<int32, [4]> var_1335_pad_0 = const()[name = tensor<string, []>("op_1335_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
858	`tensor<int32, [2]> var_1335_dilations_0 = const()[name = tensor<string, []>("op_1335_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
859	`tensor<int32, []> var_1335_groups_0 = const()[name = tensor<string, []>("op_1335_groups_0"), val = tensor<int32, []>(1)];`
860	tensor<fp16, [768, 768, 1, 1]> layers_6_self_attn_k_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(35216000))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(35510976))), name = tensor<string, []>("layers_6_self_attn_k_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
861	`tensor<fp16, [1, 768, 1, 1500]> var_1335_cast_fp16 = conv(dilations = var_1335_dilations_0, groups = var_1335_groups_0, pad = var_1335_pad_0, pad_type = var_1335_pad_type_0, strides = var_1335_strides_0, weight = layers_6_self_attn_k_proj_inlier_module_weight_to_fp16_palettized, x = obj_25_cast_fp16)[name = tensor<string, []>("op_1335_cast_fp16")];`
862	`tensor<string, []> var_1341_pad_type_0 = const()[name = tensor<string, []>("op_1341_pad_type_0"), val = tensor<string, []>("valid")];`
863	`tensor<int32, [2]> var_1341_strides_0 = const()[name = tensor<string, []>("op_1341_strides_0"), val = tensor<int32, [2]>([1, 1])];`
864	`tensor<int32, [4]> var_1341_pad_0 = const()[name = tensor<string, []>("op_1341_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
865	`tensor<int32, [2]> var_1341_dilations_0 = const()[name = tensor<string, []>("op_1341_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
866	`tensor<int32, []> var_1341_groups_0 = const()[name = tensor<string, []>("op_1341_groups_0"), val = tensor<int32, []>(1)];`
867	tensor<fp16, [768, 768, 1, 1]> layers_6_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(35518848))), name = tensor<string, []>("layers_6_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [3809]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(35511104))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
868	`tensor<fp16, [1, 768, 1, 1500]> var_1341_cast_fp16 = conv(dilations = var_1341_dilations_0, groups = var_1341_groups_0, pad = var_1341_pad_0, pad_type = var_1341_pad_type_0, strides = var_1341_strides_0, weight = layers_6_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified, x = obj_25_cast_fp16)[name = tensor<string, []>("op_1341_cast_fp16")];`
869	`tensor<fp16, [1, 768, 1, 1500]> key_13_cast_fp16 = add(x = var_1335_cast_fp16, y = var_1341_cast_fp16)[name = tensor<string, []>("key_13_cast_fp16")];`
870	`tensor<string, []> var_1351_pad_type_0 = const()[name = tensor<string, []>("op_1351_pad_type_0"), val = tensor<string, []>("valid")];`
871	`tensor<int32, [2]> var_1351_strides_0 = const()[name = tensor<string, []>("op_1351_strides_0"), val = tensor<int32, [2]>([1, 1])];`
872	`tensor<int32, [4]> var_1351_pad_0 = const()[name = tensor<string, []>("op_1351_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
873	`tensor<int32, [2]> var_1351_dilations_0 = const()[name = tensor<string, []>("op_1351_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
874	`tensor<int32, []> var_1351_groups_0 = const()[name = tensor<string, []>("op_1351_groups_0"), val = tensor<int32, []>(1)];`
875	tensor<fp16, [768, 768, 1, 1]> layers_6_self_attn_v_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(35592640))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(35887616))), name = tensor<string, []>("layers_6_self_attn_v_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
876	`tensor<fp16, [768]> layers_6_self_attn_v_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_6_self_attn_v_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(35887744)))];`
877	`tensor<fp16, [1, 768, 1, 1500]> var_1351_cast_fp16 = conv(bias = layers_6_self_attn_v_proj_inlier_module_bias_to_fp16, dilations = var_1351_dilations_0, groups = var_1351_groups_0, pad = var_1351_pad_0, pad_type = var_1351_pad_type_0, strides = var_1351_strides_0, weight = layers_6_self_attn_v_proj_inlier_module_weight_to_fp16_palettized, x = obj_25_cast_fp16)[name = tensor<string, []>("op_1351_cast_fp16")];`
878	`tensor<string, []> var_1357_pad_type_0 = const()[name = tensor<string, []>("op_1357_pad_type_0"), val = tensor<string, []>("valid")];`
879	`tensor<int32, [2]> var_1357_strides_0 = const()[name = tensor<string, []>("op_1357_strides_0"), val = tensor<int32, [2]>([1, 1])];`
880	`tensor<int32, [4]> var_1357_pad_0 = const()[name = tensor<string, []>("op_1357_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
881	`tensor<int32, [2]> var_1357_dilations_0 = const()[name = tensor<string, []>("op_1357_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
882	`tensor<int32, []> var_1357_groups_0 = const()[name = tensor<string, []>("op_1357_groups_0"), val = tensor<int32, []>(1)];`
883	tensor<fp16, [768, 768, 1, 1]> layers_6_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(35895296))), name = tensor<string, []>("layers_6_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [2927]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(35889344))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
884	`tensor<fp16, [1, 768, 1, 1500]> var_1357_cast_fp16 = conv(dilations = var_1357_dilations_0, groups = var_1357_groups_0, pad = var_1357_pad_0, pad_type = var_1357_pad_type_0, strides = var_1357_strides_0, weight = layers_6_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified, x = obj_25_cast_fp16)[name = tensor<string, []>("op_1357_cast_fp16")];`
885	`tensor<fp16, [1, 768, 1, 1500]> value_13_cast_fp16 = add(x = var_1351_cast_fp16, y = var_1357_cast_fp16)[name = tensor<string, []>("value_13_cast_fp16")];`
886	`tensor<int32, [4]> var_1361 = const()[name = tensor<string, []>("op_1361"), val = tensor<int32, [4]>([1, 12, 64, 1500])];`
887	`tensor<fp16, [1, 12, 64, 1500]> mh_q_13_cast_fp16 = reshape(shape = var_1361, x = query_13_cast_fp16)[name = tensor<string, []>("mh_q_13_cast_fp16")];`
888	`tensor<fp16, []> var_1363_to_fp16 = const()[name = tensor<string, []>("op_1363_to_fp16"), val = tensor<fp16, []>(0x1p-3)];`
889	`tensor<fp16, [1, 12, 64, 1500]> var_1364_cast_fp16 = mul(x = mh_q_13_cast_fp16, y = var_1363_to_fp16)[name = tensor<string, []>("op_1364_cast_fp16")];`
890	`tensor<int32, [4]> var_1367 = const()[name = tensor<string, []>("op_1367"), val = tensor<int32, [4]>([1, 12, 64, 1500])];`
891	`tensor<fp16, [1, 12, 64, 1500]> var_1368_cast_fp16 = reshape(shape = var_1367, x = key_13_cast_fp16)[name = tensor<string, []>("op_1368_cast_fp16")];`
892	`tensor<bool, []> mh_w_13_transpose_x_0 = const()[name = tensor<string, []>("mh_w_13_transpose_x_0"), val = tensor<bool, []>(true)];`
893	`tensor<bool, []> mh_w_13_transpose_y_0 = const()[name = tensor<string, []>("mh_w_13_transpose_y_0"), val = tensor<bool, []>(false)];`
894	`tensor<fp16, [1, 12, 1500, 1500]> mh_w_13_cast_fp16 = matmul(transpose_x = mh_w_13_transpose_x_0, transpose_y = mh_w_13_transpose_y_0, x = var_1364_cast_fp16, y = var_1368_cast_fp16)[name = tensor<string, []>("mh_w_13_cast_fp16")];`
895	`tensor<fp16, [1, 12, 1500, 1500]> var_1371_cast_fp16 = softmax(axis = var_1276, x = mh_w_13_cast_fp16)[name = tensor<string, []>("op_1371_cast_fp16")];`
896	`tensor<int32, [4]> var_1372 = const()[name = tensor<string, []>("op_1372"), val = tensor<int32, [4]>([1, 12, 64, 1500])];`
897	`tensor<fp16, [1, 12, 64, 1500]> var_1373_cast_fp16 = reshape(shape = var_1372, x = value_13_cast_fp16)[name = tensor<string, []>("op_1373_cast_fp16")];`
898	`tensor<bool, []> attn_13_transpose_x_0 = const()[name = tensor<string, []>("attn_13_transpose_x_0"), val = tensor<bool, []>(false)];`
899	`tensor<bool, []> attn_13_transpose_y_0 = const()[name = tensor<string, []>("attn_13_transpose_y_0"), val = tensor<bool, []>(true)];`
900	`tensor<fp16, [1, 12, 64, 1500]> attn_13_cast_fp16 = matmul(transpose_x = attn_13_transpose_x_0, transpose_y = attn_13_transpose_y_0, x = var_1373_cast_fp16, y = var_1371_cast_fp16)[name = tensor<string, []>("attn_13_cast_fp16")];`
901	`tensor<int32, [4]> var_1376 = const()[name = tensor<string, []>("op_1376"), val = tensor<int32, [4]>([1, 768, 1, 1500])];`
902	`tensor<fp16, [1, 768, 1, 1500]> input_49_cast_fp16 = reshape(shape = var_1376, x = attn_13_cast_fp16)[name = tensor<string, []>("input_49_cast_fp16")];`
903	`tensor<string, []> var_1386_pad_type_0 = const()[name = tensor<string, []>("op_1386_pad_type_0"), val = tensor<string, []>("valid")];`
904	`tensor<int32, [2]> var_1386_strides_0 = const()[name = tensor<string, []>("op_1386_strides_0"), val = tensor<int32, [2]>([1, 1])];`
905	`tensor<int32, [4]> var_1386_pad_0 = const()[name = tensor<string, []>("op_1386_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
906	`tensor<int32, [2]> var_1386_dilations_0 = const()[name = tensor<string, []>("op_1386_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
907	`tensor<int32, []> var_1386_groups_0 = const()[name = tensor<string, []>("op_1386_groups_0"), val = tensor<int32, []>(1)];`
908	tensor<fp16, [768, 768, 1, 1]> layers_6_self_attn_o_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(35969088))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(36264064))), name = tensor<string, []>("layers_6_self_attn_o_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
909	`tensor<fp16, [768]> layers_6_self_attn_o_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_6_self_attn_o_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(36264192)))];`
910	`tensor<fp16, [1, 768, 1, 1500]> var_1386_cast_fp16 = conv(bias = layers_6_self_attn_o_proj_inlier_module_bias_to_fp16, dilations = var_1386_dilations_0, groups = var_1386_groups_0, pad = var_1386_pad_0, pad_type = var_1386_pad_type_0, strides = var_1386_strides_0, weight = layers_6_self_attn_o_proj_inlier_module_weight_to_fp16_palettized, x = input_49_cast_fp16)[name = tensor<string, []>("op_1386_cast_fp16")];`
911	`tensor<string, []> var_1392_pad_type_0 = const()[name = tensor<string, []>("op_1392_pad_type_0"), val = tensor<string, []>("valid")];`
912	`tensor<int32, [2]> var_1392_strides_0 = const()[name = tensor<string, []>("op_1392_strides_0"), val = tensor<int32, [2]>([1, 1])];`
913	`tensor<int32, [4]> var_1392_pad_0 = const()[name = tensor<string, []>("op_1392_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
914	`tensor<int32, [2]> var_1392_dilations_0 = const()[name = tensor<string, []>("op_1392_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
915	`tensor<int32, []> var_1392_groups_0 = const()[name = tensor<string, []>("op_1392_groups_0"), val = tensor<int32, []>(1)];`
916	tensor<fp16, [768, 768, 1, 1]> layers_6_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(36270720))), name = tensor<string, []>("layers_6_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [2412]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(36265792))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
917	`tensor<fp16, [1, 768, 1, 1500]> var_1392_cast_fp16 = conv(dilations = var_1392_dilations_0, groups = var_1392_groups_0, pad = var_1392_pad_0, pad_type = var_1392_pad_type_0, strides = var_1392_strides_0, weight = layers_6_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified, x = input_49_cast_fp16)[name = tensor<string, []>("op_1392_cast_fp16")];`
918	`tensor<fp16, [1, 768, 1, 1500]> obj_27_cast_fp16 = add(x = var_1386_cast_fp16, y = var_1392_cast_fp16)[name = tensor<string, []>("obj_27_cast_fp16")];`
919	`tensor<fp16, [1, 768, 1, 1500]> inputs_27_cast_fp16 = add(x = inputs_25_cast_fp16, y = obj_27_cast_fp16)[name = tensor<string, []>("inputs_27_cast_fp16")];`
920	`tensor<int32, [1]> out_27_axes_0 = const()[name = tensor<string, []>("out_27_axes_0"), val = tensor<int32, [1]>([1])];`
921	`tensor<fp16, []> var_1403_to_fp16 = const()[name = tensor<string, []>("op_1403_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
922	`tensor<fp16, [1, 768, 1, 1500]> out_27_cast_fp16 = layer_norm(axes = out_27_axes_0, epsilon = var_1403_to_fp16, x = inputs_27_cast_fp16)[name = tensor<string, []>("out_27_cast_fp16")];`
923	`tensor<fp16, [768]> input_51_gamma_0_to_fp16 = const()[name = tensor<string, []>("input_51_gamma_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(36344512)))];`
924	`tensor<fp16, [768]> input_51_beta_0_to_fp16 = const()[name = tensor<string, []>("input_51_beta_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(36346112)))];`
925	`tensor<fp16, []> input_51_epsilon_0_to_fp16 = const()[name = tensor<string, []>("input_51_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
926	`tensor<fp16, [1, 768, 1, 1500]> input_51_cast_fp16 = batch_norm(beta = input_51_beta_0_to_fp16, epsilon = input_51_epsilon_0_to_fp16, gamma = input_51_gamma_0_to_fp16, mean = var_57_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_27_cast_fp16)[name = tensor<string, []>("input_51_cast_fp16")];`
927	`tensor<string, []> var_1421_pad_type_0 = const()[name = tensor<string, []>("op_1421_pad_type_0"), val = tensor<string, []>("valid")];`
928	`tensor<int32, [2]> var_1421_strides_0 = const()[name = tensor<string, []>("op_1421_strides_0"), val = tensor<int32, [2]>([1, 1])];`
929	`tensor<int32, [4]> var_1421_pad_0 = const()[name = tensor<string, []>("op_1421_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
930	`tensor<int32, [2]> var_1421_dilations_0 = const()[name = tensor<string, []>("op_1421_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
931	`tensor<int32, []> var_1421_groups_0 = const()[name = tensor<string, []>("op_1421_groups_0"), val = tensor<int32, []>(1)];`
932	tensor<fp16, [3072, 768, 1, 1]> layers_6_fc1_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [1179648]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(36347712))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(37527424))), name = tensor<string, []>("layers_6_fc1_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([3072, 768, 1, 1])];
933	`tensor<fp16, [3072]> layers_6_fc1_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_6_fc1_inlier_module_bias_to_fp16"), val = tensor<fp16, [3072]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(37527552)))];`
934	`tensor<fp16, [1, 3072, 1, 1500]> var_1421_cast_fp16 = conv(bias = layers_6_fc1_inlier_module_bias_to_fp16, dilations = var_1421_dilations_0, groups = var_1421_groups_0, pad = var_1421_pad_0, pad_type = var_1421_pad_type_0, strides = var_1421_strides_0, weight = layers_6_fc1_inlier_module_weight_to_fp16_palettized, x = input_51_cast_fp16)[name = tensor<string, []>("op_1421_cast_fp16")];`
935	`tensor<string, []> var_1427_pad_type_0 = const()[name = tensor<string, []>("op_1427_pad_type_0"), val = tensor<string, []>("valid")];`
936	`tensor<int32, [2]> var_1427_strides_0 = const()[name = tensor<string, []>("op_1427_strides_0"), val = tensor<int32, [2]>([1, 1])];`
937	`tensor<int32, [4]> var_1427_pad_0 = const()[name = tensor<string, []>("op_1427_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
938	`tensor<int32, [2]> var_1427_dilations_0 = const()[name = tensor<string, []>("op_1427_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
939	`tensor<int32, []> var_1427_groups_0 = const()[name = tensor<string, []>("op_1427_groups_0"), val = tensor<int32, []>(1)];`
940	tensor<fp16, [3072, 768, 1, 1]> layers_6_fc1_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(37566848))), name = tensor<string, []>("layers_6_fc1_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [16482]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(37533760))), shape = tensor<uint32, [4]>([3072, 768, 1, 1])];
941	`tensor<fp16, [1, 3072, 1, 1500]> var_1427_cast_fp16 = conv(dilations = var_1427_dilations_0, groups = var_1427_groups_0, pad = var_1427_pad_0, pad_type = var_1427_pad_type_0, strides = var_1427_strides_0, weight = layers_6_fc1_outlier_module_weight_to_fp16_sparsified, x = input_51_cast_fp16)[name = tensor<string, []>("op_1427_cast_fp16")];`
942	`tensor<fp16, [1, 3072, 1, 1500]> input_53_cast_fp16 = add(x = var_1421_cast_fp16, y = var_1427_cast_fp16)[name = tensor<string, []>("input_53_cast_fp16")];`
943	`tensor<string, []> input_55_mode_0 = const()[name = tensor<string, []>("input_55_mode_0"), val = tensor<string, []>("EXACT")];`
944	`tensor<fp16, [1, 3072, 1, 1500]> input_55_cast_fp16 = gelu(mode = input_55_mode_0, x = input_53_cast_fp16)[name = tensor<string, []>("input_55_cast_fp16")];`
945	`tensor<string, []> var_1438_pad_type_0 = const()[name = tensor<string, []>("op_1438_pad_type_0"), val = tensor<string, []>("valid")];`
946	`tensor<int32, [2]> var_1438_strides_0 = const()[name = tensor<string, []>("op_1438_strides_0"), val = tensor<int32, [2]>([1, 1])];`
947	`tensor<int32, [4]> var_1438_pad_0 = const()[name = tensor<string, []>("op_1438_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
948	`tensor<int32, [2]> var_1438_dilations_0 = const()[name = tensor<string, []>("op_1438_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
949	`tensor<int32, []> var_1438_groups_0 = const()[name = tensor<string, []>("op_1438_groups_0"), val = tensor<int32, []>(1)];`
950	tensor<fp16, [768, 3072, 1, 1]> layers_6_fc2_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [1179648]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(37861824))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(39041536))), name = tensor<string, []>("layers_6_fc2_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 3072, 1, 1])];
951	`tensor<fp16, [768]> layers_6_fc2_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_6_fc2_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(39041664)))];`
952	`tensor<fp16, [1, 768, 1, 1500]> var_1438_cast_fp16 = conv(bias = layers_6_fc2_inlier_module_bias_to_fp16, dilations = var_1438_dilations_0, groups = var_1438_groups_0, pad = var_1438_pad_0, pad_type = var_1438_pad_type_0, strides = var_1438_strides_0, weight = layers_6_fc2_inlier_module_weight_to_fp16_palettized, x = input_55_cast_fp16)[name = tensor<string, []>("op_1438_cast_fp16")];`
953	`tensor<string, []> var_1444_pad_type_0 = const()[name = tensor<string, []>("op_1444_pad_type_0"), val = tensor<string, []>("valid")];`
954	`tensor<int32, [2]> var_1444_strides_0 = const()[name = tensor<string, []>("op_1444_strides_0"), val = tensor<int32, [2]>([1, 1])];`
955	`tensor<int32, [4]> var_1444_pad_0 = const()[name = tensor<string, []>("op_1444_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
956	`tensor<int32, [2]> var_1444_dilations_0 = const()[name = tensor<string, []>("op_1444_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
957	`tensor<int32, []> var_1444_groups_0 = const()[name = tensor<string, []>("op_1444_groups_0"), val = tensor<int32, []>(1)];`
958	tensor<fp16, [768, 3072, 1, 1]> layers_6_fc2_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(39079168))), name = tensor<string, []>("layers_6_fc2_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [17897]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(39043264))), shape = tensor<uint32, [4]>([768, 3072, 1, 1])];
959	`tensor<fp16, [1, 768, 1, 1500]> var_1444_cast_fp16 = conv(dilations = var_1444_dilations_0, groups = var_1444_groups_0, pad = var_1444_pad_0, pad_type = var_1444_pad_type_0, strides = var_1444_strides_0, weight = layers_6_fc2_outlier_module_weight_to_fp16_sparsified, x = input_55_cast_fp16)[name = tensor<string, []>("op_1444_cast_fp16")];`
960	`tensor<fp16, [1, 768, 1, 1500]> hidden_states_17_cast_fp16 = add(x = var_1438_cast_fp16, y = var_1444_cast_fp16)[name = tensor<string, []>("hidden_states_17_cast_fp16")];`
961	`tensor<fp16, [1, 768, 1, 1500]> inputs_29_cast_fp16 = add(x = inputs_27_cast_fp16, y = hidden_states_17_cast_fp16)[name = tensor<string, []>("inputs_29_cast_fp16")];`
962	`tensor<int32, []> var_1450 = const()[name = tensor<string, []>("op_1450"), val = tensor<int32, []>(3)];`
963	`tensor<int32, [1]> out_29_axes_0 = const()[name = tensor<string, []>("out_29_axes_0"), val = tensor<int32, [1]>([1])];`
964	`tensor<fp16, []> var_1472_to_fp16 = const()[name = tensor<string, []>("op_1472_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
965	`tensor<fp16, [1, 768, 1, 1500]> out_29_cast_fp16 = layer_norm(axes = out_29_axes_0, epsilon = var_1472_to_fp16, x = inputs_29_cast_fp16)[name = tensor<string, []>("out_29_cast_fp16")];`
966	`tensor<fp16, [768]> obj_29_gamma_0_to_fp16 = const()[name = tensor<string, []>("obj_29_gamma_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(39374144)))];`
967	`tensor<fp16, [768]> obj_29_beta_0_to_fp16 = const()[name = tensor<string, []>("obj_29_beta_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(39375744)))];`
968	`tensor<fp16, []> obj_29_epsilon_0_to_fp16 = const()[name = tensor<string, []>("obj_29_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
969	`tensor<fp16, [1, 768, 1, 1500]> obj_29_cast_fp16 = batch_norm(beta = obj_29_beta_0_to_fp16, epsilon = obj_29_epsilon_0_to_fp16, gamma = obj_29_gamma_0_to_fp16, mean = var_57_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_29_cast_fp16)[name = tensor<string, []>("obj_29_cast_fp16")];`
970	`tensor<string, []> var_1494_pad_type_0 = const()[name = tensor<string, []>("op_1494_pad_type_0"), val = tensor<string, []>("valid")];`
971	`tensor<int32, [2]> var_1494_strides_0 = const()[name = tensor<string, []>("op_1494_strides_0"), val = tensor<int32, [2]>([1, 1])];`
972	`tensor<int32, [4]> var_1494_pad_0 = const()[name = tensor<string, []>("op_1494_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
973	`tensor<int32, [2]> var_1494_dilations_0 = const()[name = tensor<string, []>("op_1494_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
974	`tensor<int32, []> var_1494_groups_0 = const()[name = tensor<string, []>("op_1494_groups_0"), val = tensor<int32, []>(1)];`
975	tensor<fp16, [768, 768, 1, 1]> layers_7_self_attn_q_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(39377344))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(39672320))), name = tensor<string, []>("layers_7_self_attn_q_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
976	`tensor<fp16, [768]> layers_7_self_attn_q_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_7_self_attn_q_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(39672448)))];`
977	`tensor<fp16, [1, 768, 1, 1500]> var_1494_cast_fp16 = conv(bias = layers_7_self_attn_q_proj_inlier_module_bias_to_fp16, dilations = var_1494_dilations_0, groups = var_1494_groups_0, pad = var_1494_pad_0, pad_type = var_1494_pad_type_0, strides = var_1494_strides_0, weight = layers_7_self_attn_q_proj_inlier_module_weight_to_fp16_palettized, x = obj_29_cast_fp16)[name = tensor<string, []>("op_1494_cast_fp16")];`
978	`tensor<string, []> var_1500_pad_type_0 = const()[name = tensor<string, []>("op_1500_pad_type_0"), val = tensor<string, []>("valid")];`
979	`tensor<int32, [2]> var_1500_strides_0 = const()[name = tensor<string, []>("op_1500_strides_0"), val = tensor<int32, [2]>([1, 1])];`
980	`tensor<int32, [4]> var_1500_pad_0 = const()[name = tensor<string, []>("op_1500_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
981	`tensor<int32, [2]> var_1500_dilations_0 = const()[name = tensor<string, []>("op_1500_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
982	`tensor<int32, []> var_1500_groups_0 = const()[name = tensor<string, []>("op_1500_groups_0"), val = tensor<int32, []>(1)];`
983	tensor<fp16, [768, 768, 1, 1]> layers_7_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(39680704))), name = tensor<string, []>("layers_7_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [3266]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(39674048))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
984	`tensor<fp16, [1, 768, 1, 1500]> var_1500_cast_fp16 = conv(dilations = var_1500_dilations_0, groups = var_1500_groups_0, pad = var_1500_pad_0, pad_type = var_1500_pad_type_0, strides = var_1500_strides_0, weight = layers_7_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified, x = obj_29_cast_fp16)[name = tensor<string, []>("op_1500_cast_fp16")];`
985	`tensor<fp16, [1, 768, 1, 1500]> query_15_cast_fp16 = add(x = var_1494_cast_fp16, y = var_1500_cast_fp16)[name = tensor<string, []>("query_15_cast_fp16")];`
986	`tensor<string, []> var_1509_pad_type_0 = const()[name = tensor<string, []>("op_1509_pad_type_0"), val = tensor<string, []>("valid")];`
987	`tensor<int32, [2]> var_1509_strides_0 = const()[name = tensor<string, []>("op_1509_strides_0"), val = tensor<int32, [2]>([1, 1])];`
988	`tensor<int32, [4]> var_1509_pad_0 = const()[name = tensor<string, []>("op_1509_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
989	`tensor<int32, [2]> var_1509_dilations_0 = const()[name = tensor<string, []>("op_1509_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
990	`tensor<int32, []> var_1509_groups_0 = const()[name = tensor<string, []>("op_1509_groups_0"), val = tensor<int32, []>(1)];`
991	tensor<fp16, [768, 768, 1, 1]> layers_7_self_attn_k_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(39754496))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(40049472))), name = tensor<string, []>("layers_7_self_attn_k_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
992	`tensor<fp16, [1, 768, 1, 1500]> var_1509_cast_fp16 = conv(dilations = var_1509_dilations_0, groups = var_1509_groups_0, pad = var_1509_pad_0, pad_type = var_1509_pad_type_0, strides = var_1509_strides_0, weight = layers_7_self_attn_k_proj_inlier_module_weight_to_fp16_palettized, x = obj_29_cast_fp16)[name = tensor<string, []>("op_1509_cast_fp16")];`
993	`tensor<string, []> var_1515_pad_type_0 = const()[name = tensor<string, []>("op_1515_pad_type_0"), val = tensor<string, []>("valid")];`
994	`tensor<int32, [2]> var_1515_strides_0 = const()[name = tensor<string, []>("op_1515_strides_0"), val = tensor<int32, [2]>([1, 1])];`
995	`tensor<int32, [4]> var_1515_pad_0 = const()[name = tensor<string, []>("op_1515_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
996	`tensor<int32, [2]> var_1515_dilations_0 = const()[name = tensor<string, []>("op_1515_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
997	`tensor<int32, []> var_1515_groups_0 = const()[name = tensor<string, []>("op_1515_groups_0"), val = tensor<int32, []>(1)];`
998	tensor<fp16, [768, 768, 1, 1]> layers_7_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(40056832))), name = tensor<string, []>("layers_7_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [3558]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(40049600))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
999	`tensor<fp16, [1, 768, 1, 1500]> var_1515_cast_fp16 = conv(dilations = var_1515_dilations_0, groups = var_1515_groups_0, pad = var_1515_pad_0, pad_type = var_1515_pad_type_0, strides = var_1515_strides_0, weight = layers_7_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified, x = obj_29_cast_fp16)[name = tensor<string, []>("op_1515_cast_fp16")];`
1000	`tensor<fp16, [1, 768, 1, 1500]> key_15_cast_fp16 = add(x = var_1509_cast_fp16, y = var_1515_cast_fp16)[name = tensor<string, []>("key_15_cast_fp16")];`
1001	`tensor<string, []> var_1525_pad_type_0 = const()[name = tensor<string, []>("op_1525_pad_type_0"), val = tensor<string, []>("valid")];`
1002	`tensor<int32, [2]> var_1525_strides_0 = const()[name = tensor<string, []>("op_1525_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1003	`tensor<int32, [4]> var_1525_pad_0 = const()[name = tensor<string, []>("op_1525_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1004	`tensor<int32, [2]> var_1525_dilations_0 = const()[name = tensor<string, []>("op_1525_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1005	`tensor<int32, []> var_1525_groups_0 = const()[name = tensor<string, []>("op_1525_groups_0"), val = tensor<int32, []>(1)];`
1006	tensor<fp16, [768, 768, 1, 1]> layers_7_self_attn_v_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(40130624))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(40425600))), name = tensor<string, []>("layers_7_self_attn_v_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
1007	`tensor<fp16, [768]> layers_7_self_attn_v_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_7_self_attn_v_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(40425728)))];`
1008	`tensor<fp16, [1, 768, 1, 1500]> var_1525_cast_fp16 = conv(bias = layers_7_self_attn_v_proj_inlier_module_bias_to_fp16, dilations = var_1525_dilations_0, groups = var_1525_groups_0, pad = var_1525_pad_0, pad_type = var_1525_pad_type_0, strides = var_1525_strides_0, weight = layers_7_self_attn_v_proj_inlier_module_weight_to_fp16_palettized, x = obj_29_cast_fp16)[name = tensor<string, []>("op_1525_cast_fp16")];`
1009	`tensor<string, []> var_1531_pad_type_0 = const()[name = tensor<string, []>("op_1531_pad_type_0"), val = tensor<string, []>("valid")];`
1010	`tensor<int32, [2]> var_1531_strides_0 = const()[name = tensor<string, []>("op_1531_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1011	`tensor<int32, [4]> var_1531_pad_0 = const()[name = tensor<string, []>("op_1531_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1012	`tensor<int32, [2]> var_1531_dilations_0 = const()[name = tensor<string, []>("op_1531_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1013	`tensor<int32, []> var_1531_groups_0 = const()[name = tensor<string, []>("op_1531_groups_0"), val = tensor<int32, []>(1)];`
1014	tensor<fp16, [768, 768, 1, 1]> layers_7_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(40433728))), name = tensor<string, []>("layers_7_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [3154]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(40427328))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
1015	`tensor<fp16, [1, 768, 1, 1500]> var_1531_cast_fp16 = conv(dilations = var_1531_dilations_0, groups = var_1531_groups_0, pad = var_1531_pad_0, pad_type = var_1531_pad_type_0, strides = var_1531_strides_0, weight = layers_7_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified, x = obj_29_cast_fp16)[name = tensor<string, []>("op_1531_cast_fp16")];`
1016	`tensor<fp16, [1, 768, 1, 1500]> value_15_cast_fp16 = add(x = var_1525_cast_fp16, y = var_1531_cast_fp16)[name = tensor<string, []>("value_15_cast_fp16")];`
1017	`tensor<int32, [4]> var_1535 = const()[name = tensor<string, []>("op_1535"), val = tensor<int32, [4]>([1, 12, 64, 1500])];`
1018	`tensor<fp16, [1, 12, 64, 1500]> mh_q_15_cast_fp16 = reshape(shape = var_1535, x = query_15_cast_fp16)[name = tensor<string, []>("mh_q_15_cast_fp16")];`
1019	`tensor<fp16, []> var_1537_to_fp16 = const()[name = tensor<string, []>("op_1537_to_fp16"), val = tensor<fp16, []>(0x1p-3)];`
1020	`tensor<fp16, [1, 12, 64, 1500]> var_1538_cast_fp16 = mul(x = mh_q_15_cast_fp16, y = var_1537_to_fp16)[name = tensor<string, []>("op_1538_cast_fp16")];`
1021	`tensor<int32, [4]> var_1541 = const()[name = tensor<string, []>("op_1541"), val = tensor<int32, [4]>([1, 12, 64, 1500])];`
1022	`tensor<fp16, [1, 12, 64, 1500]> var_1542_cast_fp16 = reshape(shape = var_1541, x = key_15_cast_fp16)[name = tensor<string, []>("op_1542_cast_fp16")];`
1023	`tensor<bool, []> mh_w_15_transpose_x_0 = const()[name = tensor<string, []>("mh_w_15_transpose_x_0"), val = tensor<bool, []>(true)];`
1024	`tensor<bool, []> mh_w_15_transpose_y_0 = const()[name = tensor<string, []>("mh_w_15_transpose_y_0"), val = tensor<bool, []>(false)];`
1025	`tensor<fp16, [1, 12, 1500, 1500]> mh_w_15_cast_fp16 = matmul(transpose_x = mh_w_15_transpose_x_0, transpose_y = mh_w_15_transpose_y_0, x = var_1538_cast_fp16, y = var_1542_cast_fp16)[name = tensor<string, []>("mh_w_15_cast_fp16")];`
1026	`tensor<fp16, [1, 12, 1500, 1500]> var_1545_cast_fp16 = softmax(axis = var_1450, x = mh_w_15_cast_fp16)[name = tensor<string, []>("op_1545_cast_fp16")];`
1027	`tensor<int32, [4]> var_1546 = const()[name = tensor<string, []>("op_1546"), val = tensor<int32, [4]>([1, 12, 64, 1500])];`
1028	`tensor<fp16, [1, 12, 64, 1500]> var_1547_cast_fp16 = reshape(shape = var_1546, x = value_15_cast_fp16)[name = tensor<string, []>("op_1547_cast_fp16")];`
1029	`tensor<bool, []> attn_15_transpose_x_0 = const()[name = tensor<string, []>("attn_15_transpose_x_0"), val = tensor<bool, []>(false)];`
1030	`tensor<bool, []> attn_15_transpose_y_0 = const()[name = tensor<string, []>("attn_15_transpose_y_0"), val = tensor<bool, []>(true)];`
1031	`tensor<fp16, [1, 12, 64, 1500]> attn_15_cast_fp16 = matmul(transpose_x = attn_15_transpose_x_0, transpose_y = attn_15_transpose_y_0, x = var_1547_cast_fp16, y = var_1545_cast_fp16)[name = tensor<string, []>("attn_15_cast_fp16")];`
1032	`tensor<int32, [4]> var_1550 = const()[name = tensor<string, []>("op_1550"), val = tensor<int32, [4]>([1, 768, 1, 1500])];`
1033	`tensor<fp16, [1, 768, 1, 1500]> input_57_cast_fp16 = reshape(shape = var_1550, x = attn_15_cast_fp16)[name = tensor<string, []>("input_57_cast_fp16")];`
1034	`tensor<string, []> var_1560_pad_type_0 = const()[name = tensor<string, []>("op_1560_pad_type_0"), val = tensor<string, []>("valid")];`
1035	`tensor<int32, [2]> var_1560_strides_0 = const()[name = tensor<string, []>("op_1560_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1036	`tensor<int32, [4]> var_1560_pad_0 = const()[name = tensor<string, []>("op_1560_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1037	`tensor<int32, [2]> var_1560_dilations_0 = const()[name = tensor<string, []>("op_1560_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1038	`tensor<int32, []> var_1560_groups_0 = const()[name = tensor<string, []>("op_1560_groups_0"), val = tensor<int32, []>(1)];`
1039	tensor<fp16, [768, 768, 1, 1]> layers_7_self_attn_o_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(40507520))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(40802496))), name = tensor<string, []>("layers_7_self_attn_o_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
1040	`tensor<fp16, [768]> layers_7_self_attn_o_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_7_self_attn_o_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(40802624)))];`
1041	`tensor<fp16, [1, 768, 1, 1500]> var_1560_cast_fp16 = conv(bias = layers_7_self_attn_o_proj_inlier_module_bias_to_fp16, dilations = var_1560_dilations_0, groups = var_1560_groups_0, pad = var_1560_pad_0, pad_type = var_1560_pad_type_0, strides = var_1560_strides_0, weight = layers_7_self_attn_o_proj_inlier_module_weight_to_fp16_palettized, x = input_57_cast_fp16)[name = tensor<string, []>("op_1560_cast_fp16")];`
1042	`tensor<string, []> var_1566_pad_type_0 = const()[name = tensor<string, []>("op_1566_pad_type_0"), val = tensor<string, []>("valid")];`
1043	`tensor<int32, [2]> var_1566_strides_0 = const()[name = tensor<string, []>("op_1566_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1044	`tensor<int32, [4]> var_1566_pad_0 = const()[name = tensor<string, []>("op_1566_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1045	`tensor<int32, [2]> var_1566_dilations_0 = const()[name = tensor<string, []>("op_1566_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1046	`tensor<int32, []> var_1566_groups_0 = const()[name = tensor<string, []>("op_1566_groups_0"), val = tensor<int32, []>(1)];`
1047	tensor<fp16, [768, 768, 1, 1]> layers_7_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(40810112))), name = tensor<string, []>("layers_7_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [2902]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(40804224))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
1048	`tensor<fp16, [1, 768, 1, 1500]> var_1566_cast_fp16 = conv(dilations = var_1566_dilations_0, groups = var_1566_groups_0, pad = var_1566_pad_0, pad_type = var_1566_pad_type_0, strides = var_1566_strides_0, weight = layers_7_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified, x = input_57_cast_fp16)[name = tensor<string, []>("op_1566_cast_fp16")];`
1049	`tensor<fp16, [1, 768, 1, 1500]> obj_31_cast_fp16 = add(x = var_1560_cast_fp16, y = var_1566_cast_fp16)[name = tensor<string, []>("obj_31_cast_fp16")];`
1050	`tensor<fp16, [1, 768, 1, 1500]> inputs_31_cast_fp16 = add(x = inputs_29_cast_fp16, y = obj_31_cast_fp16)[name = tensor<string, []>("inputs_31_cast_fp16")];`
1051	`tensor<int32, [1]> out_31_axes_0 = const()[name = tensor<string, []>("out_31_axes_0"), val = tensor<int32, [1]>([1])];`
1052	`tensor<fp16, []> var_1577_to_fp16 = const()[name = tensor<string, []>("op_1577_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
1053	`tensor<fp16, [1, 768, 1, 1500]> out_31_cast_fp16 = layer_norm(axes = out_31_axes_0, epsilon = var_1577_to_fp16, x = inputs_31_cast_fp16)[name = tensor<string, []>("out_31_cast_fp16")];`
1054	`tensor<fp16, [768]> input_59_gamma_0_to_fp16 = const()[name = tensor<string, []>("input_59_gamma_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(40883904)))];`
1055	`tensor<fp16, [768]> input_59_beta_0_to_fp16 = const()[name = tensor<string, []>("input_59_beta_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(40885504)))];`
1056	`tensor<fp16, []> input_59_epsilon_0_to_fp16 = const()[name = tensor<string, []>("input_59_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
1057	`tensor<fp16, [1, 768, 1, 1500]> input_59_cast_fp16 = batch_norm(beta = input_59_beta_0_to_fp16, epsilon = input_59_epsilon_0_to_fp16, gamma = input_59_gamma_0_to_fp16, mean = var_57_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_31_cast_fp16)[name = tensor<string, []>("input_59_cast_fp16")];`
1058	`tensor<string, []> var_1595_pad_type_0 = const()[name = tensor<string, []>("op_1595_pad_type_0"), val = tensor<string, []>("valid")];`
1059	`tensor<int32, [2]> var_1595_strides_0 = const()[name = tensor<string, []>("op_1595_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1060	`tensor<int32, [4]> var_1595_pad_0 = const()[name = tensor<string, []>("op_1595_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1061	`tensor<int32, [2]> var_1595_dilations_0 = const()[name = tensor<string, []>("op_1595_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1062	`tensor<int32, []> var_1595_groups_0 = const()[name = tensor<string, []>("op_1595_groups_0"), val = tensor<int32, []>(1)];`
1063	tensor<fp16, [3072, 768, 1, 1]> layers_7_fc1_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [1179648]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(40887104))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(42066816))), name = tensor<string, []>("layers_7_fc1_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([3072, 768, 1, 1])];
1064	`tensor<fp16, [3072]> layers_7_fc1_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_7_fc1_inlier_module_bias_to_fp16"), val = tensor<fp16, [3072]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(42066944)))];`
1065	`tensor<fp16, [1, 3072, 1, 1500]> var_1595_cast_fp16 = conv(bias = layers_7_fc1_inlier_module_bias_to_fp16, dilations = var_1595_dilations_0, groups = var_1595_groups_0, pad = var_1595_pad_0, pad_type = var_1595_pad_type_0, strides = var_1595_strides_0, weight = layers_7_fc1_inlier_module_weight_to_fp16_palettized, x = input_59_cast_fp16)[name = tensor<string, []>("op_1595_cast_fp16")];`
1066	`tensor<string, []> var_1601_pad_type_0 = const()[name = tensor<string, []>("op_1601_pad_type_0"), val = tensor<string, []>("valid")];`
1067	`tensor<int32, [2]> var_1601_strides_0 = const()[name = tensor<string, []>("op_1601_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1068	`tensor<int32, [4]> var_1601_pad_0 = const()[name = tensor<string, []>("op_1601_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1069	`tensor<int32, [2]> var_1601_dilations_0 = const()[name = tensor<string, []>("op_1601_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1070	`tensor<int32, []> var_1601_groups_0 = const()[name = tensor<string, []>("op_1601_groups_0"), val = tensor<int32, []>(1)];`
1071	tensor<fp16, [3072, 768, 1, 1]> layers_7_fc1_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(42110976))), name = tensor<string, []>("layers_7_fc1_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [18849]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(42073152))), shape = tensor<uint32, [4]>([3072, 768, 1, 1])];
1072	`tensor<fp16, [1, 3072, 1, 1500]> var_1601_cast_fp16 = conv(dilations = var_1601_dilations_0, groups = var_1601_groups_0, pad = var_1601_pad_0, pad_type = var_1601_pad_type_0, strides = var_1601_strides_0, weight = layers_7_fc1_outlier_module_weight_to_fp16_sparsified, x = input_59_cast_fp16)[name = tensor<string, []>("op_1601_cast_fp16")];`
1073	`tensor<fp16, [1, 3072, 1, 1500]> input_61_cast_fp16 = add(x = var_1595_cast_fp16, y = var_1601_cast_fp16)[name = tensor<string, []>("input_61_cast_fp16")];`
1074	`tensor<string, []> input_63_mode_0 = const()[name = tensor<string, []>("input_63_mode_0"), val = tensor<string, []>("EXACT")];`
1075	`tensor<fp16, [1, 3072, 1, 1500]> input_63_cast_fp16 = gelu(mode = input_63_mode_0, x = input_61_cast_fp16)[name = tensor<string, []>("input_63_cast_fp16")];`
1076	`tensor<string, []> var_1612_pad_type_0 = const()[name = tensor<string, []>("op_1612_pad_type_0"), val = tensor<string, []>("valid")];`
1077	`tensor<int32, [2]> var_1612_strides_0 = const()[name = tensor<string, []>("op_1612_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1078	`tensor<int32, [4]> var_1612_pad_0 = const()[name = tensor<string, []>("op_1612_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1079	`tensor<int32, [2]> var_1612_dilations_0 = const()[name = tensor<string, []>("op_1612_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1080	`tensor<int32, []> var_1612_groups_0 = const()[name = tensor<string, []>("op_1612_groups_0"), val = tensor<int32, []>(1)];`
1081	tensor<fp16, [768, 3072, 1, 1]> layers_7_fc2_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [1179648]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(42405952))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(43585664))), name = tensor<string, []>("layers_7_fc2_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 3072, 1, 1])];
1082	`tensor<fp16, [768]> layers_7_fc2_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_7_fc2_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(43585792)))];`
1083	`tensor<fp16, [1, 768, 1, 1500]> var_1612_cast_fp16 = conv(bias = layers_7_fc2_inlier_module_bias_to_fp16, dilations = var_1612_dilations_0, groups = var_1612_groups_0, pad = var_1612_pad_0, pad_type = var_1612_pad_type_0, strides = var_1612_strides_0, weight = layers_7_fc2_inlier_module_weight_to_fp16_palettized, x = input_63_cast_fp16)[name = tensor<string, []>("op_1612_cast_fp16")];`
1084	`tensor<string, []> var_1618_pad_type_0 = const()[name = tensor<string, []>("op_1618_pad_type_0"), val = tensor<string, []>("valid")];`
1085	`tensor<int32, [2]> var_1618_strides_0 = const()[name = tensor<string, []>("op_1618_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1086	`tensor<int32, [4]> var_1618_pad_0 = const()[name = tensor<string, []>("op_1618_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1087	`tensor<int32, [2]> var_1618_dilations_0 = const()[name = tensor<string, []>("op_1618_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1088	`tensor<int32, []> var_1618_groups_0 = const()[name = tensor<string, []>("op_1618_groups_0"), val = tensor<int32, []>(1)];`
1089	tensor<fp16, [768, 3072, 1, 1]> layers_7_fc2_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(43616960))), name = tensor<string, []>("layers_7_fc2_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [14729]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(43587392))), shape = tensor<uint32, [4]>([768, 3072, 1, 1])];
1090	`tensor<fp16, [1, 768, 1, 1500]> var_1618_cast_fp16 = conv(dilations = var_1618_dilations_0, groups = var_1618_groups_0, pad = var_1618_pad_0, pad_type = var_1618_pad_type_0, strides = var_1618_strides_0, weight = layers_7_fc2_outlier_module_weight_to_fp16_sparsified, x = input_63_cast_fp16)[name = tensor<string, []>("op_1618_cast_fp16")];`
1091	`tensor<fp16, [1, 768, 1, 1500]> hidden_states_19_cast_fp16 = add(x = var_1612_cast_fp16, y = var_1618_cast_fp16)[name = tensor<string, []>("hidden_states_19_cast_fp16")];`
1092	`tensor<fp16, [1, 768, 1, 1500]> inputs_33_cast_fp16 = add(x = inputs_31_cast_fp16, y = hidden_states_19_cast_fp16)[name = tensor<string, []>("inputs_33_cast_fp16")];`
1093	`tensor<int32, []> var_1624 = const()[name = tensor<string, []>("op_1624"), val = tensor<int32, []>(3)];`
1094	`tensor<int32, [1]> out_33_axes_0 = const()[name = tensor<string, []>("out_33_axes_0"), val = tensor<int32, [1]>([1])];`
1095	`tensor<fp16, []> var_1646_to_fp16 = const()[name = tensor<string, []>("op_1646_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
1096	`tensor<fp16, [1, 768, 1, 1500]> out_33_cast_fp16 = layer_norm(axes = out_33_axes_0, epsilon = var_1646_to_fp16, x = inputs_33_cast_fp16)[name = tensor<string, []>("out_33_cast_fp16")];`
1097	`tensor<fp16, [768]> obj_33_gamma_0_to_fp16 = const()[name = tensor<string, []>("obj_33_gamma_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(43911936)))];`
1098	`tensor<fp16, [768]> obj_33_beta_0_to_fp16 = const()[name = tensor<string, []>("obj_33_beta_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(43913536)))];`
1099	`tensor<fp16, []> obj_33_epsilon_0_to_fp16 = const()[name = tensor<string, []>("obj_33_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
1100	`tensor<fp16, [1, 768, 1, 1500]> obj_33_cast_fp16 = batch_norm(beta = obj_33_beta_0_to_fp16, epsilon = obj_33_epsilon_0_to_fp16, gamma = obj_33_gamma_0_to_fp16, mean = var_57_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_33_cast_fp16)[name = tensor<string, []>("obj_33_cast_fp16")];`
1101	`tensor<string, []> var_1668_pad_type_0 = const()[name = tensor<string, []>("op_1668_pad_type_0"), val = tensor<string, []>("valid")];`
1102	`tensor<int32, [2]> var_1668_strides_0 = const()[name = tensor<string, []>("op_1668_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1103	`tensor<int32, [4]> var_1668_pad_0 = const()[name = tensor<string, []>("op_1668_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1104	`tensor<int32, [2]> var_1668_dilations_0 = const()[name = tensor<string, []>("op_1668_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1105	`tensor<int32, []> var_1668_groups_0 = const()[name = tensor<string, []>("op_1668_groups_0"), val = tensor<int32, []>(1)];`
1106	tensor<fp16, [768, 768, 1, 1]> layers_8_self_attn_q_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(43915136))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(44210112))), name = tensor<string, []>("layers_8_self_attn_q_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
1107	`tensor<fp16, [768]> layers_8_self_attn_q_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_8_self_attn_q_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(44210240)))];`
1108	`tensor<fp16, [1, 768, 1, 1500]> var_1668_cast_fp16 = conv(bias = layers_8_self_attn_q_proj_inlier_module_bias_to_fp16, dilations = var_1668_dilations_0, groups = var_1668_groups_0, pad = var_1668_pad_0, pad_type = var_1668_pad_type_0, strides = var_1668_strides_0, weight = layers_8_self_attn_q_proj_inlier_module_weight_to_fp16_palettized, x = obj_33_cast_fp16)[name = tensor<string, []>("op_1668_cast_fp16")];`
1109	`tensor<string, []> var_1674_pad_type_0 = const()[name = tensor<string, []>("op_1674_pad_type_0"), val = tensor<string, []>("valid")];`
1110	`tensor<int32, [2]> var_1674_strides_0 = const()[name = tensor<string, []>("op_1674_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1111	`tensor<int32, [4]> var_1674_pad_0 = const()[name = tensor<string, []>("op_1674_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1112	`tensor<int32, [2]> var_1674_dilations_0 = const()[name = tensor<string, []>("op_1674_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1113	`tensor<int32, []> var_1674_groups_0 = const()[name = tensor<string, []>("op_1674_groups_0"), val = tensor<int32, []>(1)];`
1114	tensor<fp16, [768, 768, 1, 1]> layers_8_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(44219008))), name = tensor<string, []>("layers_8_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [3550]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(44211840))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
1115	`tensor<fp16, [1, 768, 1, 1500]> var_1674_cast_fp16 = conv(dilations = var_1674_dilations_0, groups = var_1674_groups_0, pad = var_1674_pad_0, pad_type = var_1674_pad_type_0, strides = var_1674_strides_0, weight = layers_8_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified, x = obj_33_cast_fp16)[name = tensor<string, []>("op_1674_cast_fp16")];`
1116	`tensor<fp16, [1, 768, 1, 1500]> query_17_cast_fp16 = add(x = var_1668_cast_fp16, y = var_1674_cast_fp16)[name = tensor<string, []>("query_17_cast_fp16")];`
1117	`tensor<string, []> var_1683_pad_type_0 = const()[name = tensor<string, []>("op_1683_pad_type_0"), val = tensor<string, []>("valid")];`
1118	`tensor<int32, [2]> var_1683_strides_0 = const()[name = tensor<string, []>("op_1683_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1119	`tensor<int32, [4]> var_1683_pad_0 = const()[name = tensor<string, []>("op_1683_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1120	`tensor<int32, [2]> var_1683_dilations_0 = const()[name = tensor<string, []>("op_1683_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1121	`tensor<int32, []> var_1683_groups_0 = const()[name = tensor<string, []>("op_1683_groups_0"), val = tensor<int32, []>(1)];`
1122	tensor<fp16, [768, 768, 1, 1]> layers_8_self_attn_k_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(44292800))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(44587776))), name = tensor<string, []>("layers_8_self_attn_k_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
1123	`tensor<fp16, [1, 768, 1, 1500]> var_1683_cast_fp16 = conv(dilations = var_1683_dilations_0, groups = var_1683_groups_0, pad = var_1683_pad_0, pad_type = var_1683_pad_type_0, strides = var_1683_strides_0, weight = layers_8_self_attn_k_proj_inlier_module_weight_to_fp16_palettized, x = obj_33_cast_fp16)[name = tensor<string, []>("op_1683_cast_fp16")];`
1124	`tensor<string, []> var_1689_pad_type_0 = const()[name = tensor<string, []>("op_1689_pad_type_0"), val = tensor<string, []>("valid")];`
1125	`tensor<int32, [2]> var_1689_strides_0 = const()[name = tensor<string, []>("op_1689_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1126	`tensor<int32, [4]> var_1689_pad_0 = const()[name = tensor<string, []>("op_1689_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1127	`tensor<int32, [2]> var_1689_dilations_0 = const()[name = tensor<string, []>("op_1689_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1128	`tensor<int32, []> var_1689_groups_0 = const()[name = tensor<string, []>("op_1689_groups_0"), val = tensor<int32, []>(1)];`
1129	tensor<fp16, [768, 768, 1, 1]> layers_8_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(44595136))), name = tensor<string, []>("layers_8_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [3567]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(44587904))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
1130	`tensor<fp16, [1, 768, 1, 1500]> var_1689_cast_fp16 = conv(dilations = var_1689_dilations_0, groups = var_1689_groups_0, pad = var_1689_pad_0, pad_type = var_1689_pad_type_0, strides = var_1689_strides_0, weight = layers_8_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified, x = obj_33_cast_fp16)[name = tensor<string, []>("op_1689_cast_fp16")];`
1131	`tensor<fp16, [1, 768, 1, 1500]> key_17_cast_fp16 = add(x = var_1683_cast_fp16, y = var_1689_cast_fp16)[name = tensor<string, []>("key_17_cast_fp16")];`
1132	`tensor<string, []> var_1699_pad_type_0 = const()[name = tensor<string, []>("op_1699_pad_type_0"), val = tensor<string, []>("valid")];`
1133	`tensor<int32, [2]> var_1699_strides_0 = const()[name = tensor<string, []>("op_1699_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1134	`tensor<int32, [4]> var_1699_pad_0 = const()[name = tensor<string, []>("op_1699_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1135	`tensor<int32, [2]> var_1699_dilations_0 = const()[name = tensor<string, []>("op_1699_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1136	`tensor<int32, []> var_1699_groups_0 = const()[name = tensor<string, []>("op_1699_groups_0"), val = tensor<int32, []>(1)];`
1137	tensor<fp16, [768, 768, 1, 1]> layers_8_self_attn_v_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(44668928))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(44963904))), name = tensor<string, []>("layers_8_self_attn_v_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
1138	`tensor<fp16, [768]> layers_8_self_attn_v_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_8_self_attn_v_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(44964032)))];`
1139	`tensor<fp16, [1, 768, 1, 1500]> var_1699_cast_fp16 = conv(bias = layers_8_self_attn_v_proj_inlier_module_bias_to_fp16, dilations = var_1699_dilations_0, groups = var_1699_groups_0, pad = var_1699_pad_0, pad_type = var_1699_pad_type_0, strides = var_1699_strides_0, weight = layers_8_self_attn_v_proj_inlier_module_weight_to_fp16_palettized, x = obj_33_cast_fp16)[name = tensor<string, []>("op_1699_cast_fp16")];`
1140	`tensor<string, []> var_1705_pad_type_0 = const()[name = tensor<string, []>("op_1705_pad_type_0"), val = tensor<string, []>("valid")];`
1141	`tensor<int32, [2]> var_1705_strides_0 = const()[name = tensor<string, []>("op_1705_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1142	`tensor<int32, [4]> var_1705_pad_0 = const()[name = tensor<string, []>("op_1705_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1143	`tensor<int32, [2]> var_1705_dilations_0 = const()[name = tensor<string, []>("op_1705_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1144	`tensor<int32, []> var_1705_groups_0 = const()[name = tensor<string, []>("op_1705_groups_0"), val = tensor<int32, []>(1)];`
1145	tensor<fp16, [768, 768, 1, 1]> layers_8_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(44971200))), name = tensor<string, []>("layers_8_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [2744]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(44965632))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
1146	`tensor<fp16, [1, 768, 1, 1500]> var_1705_cast_fp16 = conv(dilations = var_1705_dilations_0, groups = var_1705_groups_0, pad = var_1705_pad_0, pad_type = var_1705_pad_type_0, strides = var_1705_strides_0, weight = layers_8_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified, x = obj_33_cast_fp16)[name = tensor<string, []>("op_1705_cast_fp16")];`
1147	`tensor<fp16, [1, 768, 1, 1500]> value_17_cast_fp16 = add(x = var_1699_cast_fp16, y = var_1705_cast_fp16)[name = tensor<string, []>("value_17_cast_fp16")];`
1148	`tensor<int32, [4]> var_1709 = const()[name = tensor<string, []>("op_1709"), val = tensor<int32, [4]>([1, 12, 64, 1500])];`
1149	`tensor<fp16, [1, 12, 64, 1500]> mh_q_17_cast_fp16 = reshape(shape = var_1709, x = query_17_cast_fp16)[name = tensor<string, []>("mh_q_17_cast_fp16")];`
1150	`tensor<fp16, []> var_1711_to_fp16 = const()[name = tensor<string, []>("op_1711_to_fp16"), val = tensor<fp16, []>(0x1p-3)];`
1151	`tensor<fp16, [1, 12, 64, 1500]> var_1712_cast_fp16 = mul(x = mh_q_17_cast_fp16, y = var_1711_to_fp16)[name = tensor<string, []>("op_1712_cast_fp16")];`
1152	`tensor<int32, [4]> var_1715 = const()[name = tensor<string, []>("op_1715"), val = tensor<int32, [4]>([1, 12, 64, 1500])];`
1153	`tensor<fp16, [1, 12, 64, 1500]> var_1716_cast_fp16 = reshape(shape = var_1715, x = key_17_cast_fp16)[name = tensor<string, []>("op_1716_cast_fp16")];`
1154	`tensor<bool, []> mh_w_17_transpose_x_0 = const()[name = tensor<string, []>("mh_w_17_transpose_x_0"), val = tensor<bool, []>(true)];`
1155	`tensor<bool, []> mh_w_17_transpose_y_0 = const()[name = tensor<string, []>("mh_w_17_transpose_y_0"), val = tensor<bool, []>(false)];`
1156	`tensor<fp16, [1, 12, 1500, 1500]> mh_w_17_cast_fp16 = matmul(transpose_x = mh_w_17_transpose_x_0, transpose_y = mh_w_17_transpose_y_0, x = var_1712_cast_fp16, y = var_1716_cast_fp16)[name = tensor<string, []>("mh_w_17_cast_fp16")];`
1157	`tensor<fp16, [1, 12, 1500, 1500]> var_1719_cast_fp16 = softmax(axis = var_1624, x = mh_w_17_cast_fp16)[name = tensor<string, []>("op_1719_cast_fp16")];`
1158	`tensor<int32, [4]> var_1720 = const()[name = tensor<string, []>("op_1720"), val = tensor<int32, [4]>([1, 12, 64, 1500])];`
1159	`tensor<fp16, [1, 12, 64, 1500]> var_1721_cast_fp16 = reshape(shape = var_1720, x = value_17_cast_fp16)[name = tensor<string, []>("op_1721_cast_fp16")];`
1160	`tensor<bool, []> attn_17_transpose_x_0 = const()[name = tensor<string, []>("attn_17_transpose_x_0"), val = tensor<bool, []>(false)];`
1161	`tensor<bool, []> attn_17_transpose_y_0 = const()[name = tensor<string, []>("attn_17_transpose_y_0"), val = tensor<bool, []>(true)];`
1162	`tensor<fp16, [1, 12, 64, 1500]> attn_17_cast_fp16 = matmul(transpose_x = attn_17_transpose_x_0, transpose_y = attn_17_transpose_y_0, x = var_1721_cast_fp16, y = var_1719_cast_fp16)[name = tensor<string, []>("attn_17_cast_fp16")];`
1163	`tensor<int32, [4]> var_1724 = const()[name = tensor<string, []>("op_1724"), val = tensor<int32, [4]>([1, 768, 1, 1500])];`
1164	`tensor<fp16, [1, 768, 1, 1500]> input_65_cast_fp16 = reshape(shape = var_1724, x = attn_17_cast_fp16)[name = tensor<string, []>("input_65_cast_fp16")];`
1165	`tensor<string, []> var_1734_pad_type_0 = const()[name = tensor<string, []>("op_1734_pad_type_0"), val = tensor<string, []>("valid")];`
1166	`tensor<int32, [2]> var_1734_strides_0 = const()[name = tensor<string, []>("op_1734_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1167	`tensor<int32, [4]> var_1734_pad_0 = const()[name = tensor<string, []>("op_1734_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1168	`tensor<int32, [2]> var_1734_dilations_0 = const()[name = tensor<string, []>("op_1734_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1169	`tensor<int32, []> var_1734_groups_0 = const()[name = tensor<string, []>("op_1734_groups_0"), val = tensor<int32, []>(1)];`
1170	tensor<fp16, [768, 768, 1, 1]> layers_8_self_attn_o_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(45044992))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(45339968))), name = tensor<string, []>("layers_8_self_attn_o_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
1171	`tensor<fp16, [768]> layers_8_self_attn_o_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_8_self_attn_o_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(45340096)))];`
1172	`tensor<fp16, [1, 768, 1, 1500]> var_1734_cast_fp16 = conv(bias = layers_8_self_attn_o_proj_inlier_module_bias_to_fp16, dilations = var_1734_dilations_0, groups = var_1734_groups_0, pad = var_1734_pad_0, pad_type = var_1734_pad_type_0, strides = var_1734_strides_0, weight = layers_8_self_attn_o_proj_inlier_module_weight_to_fp16_palettized, x = input_65_cast_fp16)[name = tensor<string, []>("op_1734_cast_fp16")];`
1173	`tensor<string, []> var_1740_pad_type_0 = const()[name = tensor<string, []>("op_1740_pad_type_0"), val = tensor<string, []>("valid")];`
1174	`tensor<int32, [2]> var_1740_strides_0 = const()[name = tensor<string, []>("op_1740_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1175	`tensor<int32, [4]> var_1740_pad_0 = const()[name = tensor<string, []>("op_1740_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1176	`tensor<int32, [2]> var_1740_dilations_0 = const()[name = tensor<string, []>("op_1740_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1177	`tensor<int32, []> var_1740_groups_0 = const()[name = tensor<string, []>("op_1740_groups_0"), val = tensor<int32, []>(1)];`
1178	tensor<fp16, [768, 768, 1, 1]> layers_8_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(45347776))), name = tensor<string, []>("layers_8_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [2992]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(45341696))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
1179	`tensor<fp16, [1, 768, 1, 1500]> var_1740_cast_fp16 = conv(dilations = var_1740_dilations_0, groups = var_1740_groups_0, pad = var_1740_pad_0, pad_type = var_1740_pad_type_0, strides = var_1740_strides_0, weight = layers_8_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified, x = input_65_cast_fp16)[name = tensor<string, []>("op_1740_cast_fp16")];`
1180	`tensor<fp16, [1, 768, 1, 1500]> obj_35_cast_fp16 = add(x = var_1734_cast_fp16, y = var_1740_cast_fp16)[name = tensor<string, []>("obj_35_cast_fp16")];`
1181	`tensor<fp16, [1, 768, 1, 1500]> inputs_35_cast_fp16 = add(x = inputs_33_cast_fp16, y = obj_35_cast_fp16)[name = tensor<string, []>("inputs_35_cast_fp16")];`
1182	`tensor<int32, [1]> out_35_axes_0 = const()[name = tensor<string, []>("out_35_axes_0"), val = tensor<int32, [1]>([1])];`
1183	`tensor<fp16, []> var_1751_to_fp16 = const()[name = tensor<string, []>("op_1751_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
1184	`tensor<fp16, [1, 768, 1, 1500]> out_35_cast_fp16 = layer_norm(axes = out_35_axes_0, epsilon = var_1751_to_fp16, x = inputs_35_cast_fp16)[name = tensor<string, []>("out_35_cast_fp16")];`
1185	`tensor<fp16, [768]> input_67_gamma_0_to_fp16 = const()[name = tensor<string, []>("input_67_gamma_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(45421568)))];`
1186	`tensor<fp16, [768]> input_67_beta_0_to_fp16 = const()[name = tensor<string, []>("input_67_beta_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(45423168)))];`
1187	`tensor<fp16, []> input_67_epsilon_0_to_fp16 = const()[name = tensor<string, []>("input_67_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
1188	`tensor<fp16, [1, 768, 1, 1500]> input_67_cast_fp16 = batch_norm(beta = input_67_beta_0_to_fp16, epsilon = input_67_epsilon_0_to_fp16, gamma = input_67_gamma_0_to_fp16, mean = var_57_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_35_cast_fp16)[name = tensor<string, []>("input_67_cast_fp16")];`
1189	`tensor<string, []> var_1769_pad_type_0 = const()[name = tensor<string, []>("op_1769_pad_type_0"), val = tensor<string, []>("valid")];`
1190	`tensor<int32, [2]> var_1769_strides_0 = const()[name = tensor<string, []>("op_1769_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1191	`tensor<int32, [4]> var_1769_pad_0 = const()[name = tensor<string, []>("op_1769_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1192	`tensor<int32, [2]> var_1769_dilations_0 = const()[name = tensor<string, []>("op_1769_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1193	`tensor<int32, []> var_1769_groups_0 = const()[name = tensor<string, []>("op_1769_groups_0"), val = tensor<int32, []>(1)];`
1194	tensor<fp16, [3072, 768, 1, 1]> layers_8_fc1_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [1179648]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(45424768))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(46604480))), name = tensor<string, []>("layers_8_fc1_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([3072, 768, 1, 1])];
1195	`tensor<fp16, [3072]> layers_8_fc1_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_8_fc1_inlier_module_bias_to_fp16"), val = tensor<fp16, [3072]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(46604608)))];`
1196	`tensor<fp16, [1, 3072, 1, 1500]> var_1769_cast_fp16 = conv(bias = layers_8_fc1_inlier_module_bias_to_fp16, dilations = var_1769_dilations_0, groups = var_1769_groups_0, pad = var_1769_pad_0, pad_type = var_1769_pad_type_0, strides = var_1769_strides_0, weight = layers_8_fc1_inlier_module_weight_to_fp16_palettized, x = input_67_cast_fp16)[name = tensor<string, []>("op_1769_cast_fp16")];`
1197	`tensor<string, []> var_1775_pad_type_0 = const()[name = tensor<string, []>("op_1775_pad_type_0"), val = tensor<string, []>("valid")];`
1198	`tensor<int32, [2]> var_1775_strides_0 = const()[name = tensor<string, []>("op_1775_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1199	`tensor<int32, [4]> var_1775_pad_0 = const()[name = tensor<string, []>("op_1775_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1200	`tensor<int32, [2]> var_1775_dilations_0 = const()[name = tensor<string, []>("op_1775_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1201	`tensor<int32, []> var_1775_groups_0 = const()[name = tensor<string, []>("op_1775_groups_0"), val = tensor<int32, []>(1)];`
1202	tensor<fp16, [3072, 768, 1, 1]> layers_8_fc1_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(46641984))), name = tensor<string, []>("layers_8_fc1_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [15537]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(46610816))), shape = tensor<uint32, [4]>([3072, 768, 1, 1])];
1203	`tensor<fp16, [1, 3072, 1, 1500]> var_1775_cast_fp16 = conv(dilations = var_1775_dilations_0, groups = var_1775_groups_0, pad = var_1775_pad_0, pad_type = var_1775_pad_type_0, strides = var_1775_strides_0, weight = layers_8_fc1_outlier_module_weight_to_fp16_sparsified, x = input_67_cast_fp16)[name = tensor<string, []>("op_1775_cast_fp16")];`
1204	`tensor<fp16, [1, 3072, 1, 1500]> input_69_cast_fp16 = add(x = var_1769_cast_fp16, y = var_1775_cast_fp16)[name = tensor<string, []>("input_69_cast_fp16")];`
1205	`tensor<string, []> input_71_mode_0 = const()[name = tensor<string, []>("input_71_mode_0"), val = tensor<string, []>("EXACT")];`
1206	`tensor<fp16, [1, 3072, 1, 1500]> input_71_cast_fp16 = gelu(mode = input_71_mode_0, x = input_69_cast_fp16)[name = tensor<string, []>("input_71_cast_fp16")];`
1207	`tensor<string, []> var_1786_pad_type_0 = const()[name = tensor<string, []>("op_1786_pad_type_0"), val = tensor<string, []>("valid")];`
1208	`tensor<int32, [2]> var_1786_strides_0 = const()[name = tensor<string, []>("op_1786_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1209	`tensor<int32, [4]> var_1786_pad_0 = const()[name = tensor<string, []>("op_1786_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1210	`tensor<int32, [2]> var_1786_dilations_0 = const()[name = tensor<string, []>("op_1786_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1211	`tensor<int32, []> var_1786_groups_0 = const()[name = tensor<string, []>("op_1786_groups_0"), val = tensor<int32, []>(1)];`
1212	tensor<fp16, [768, 3072, 1, 1]> layers_8_fc2_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [1179648]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(46936960))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(48116672))), name = tensor<string, []>("layers_8_fc2_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 3072, 1, 1])];
1213	`tensor<fp16, [768]> layers_8_fc2_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_8_fc2_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(48116800)))];`
1214	`tensor<fp16, [1, 768, 1, 1500]> var_1786_cast_fp16 = conv(bias = layers_8_fc2_inlier_module_bias_to_fp16, dilations = var_1786_dilations_0, groups = var_1786_groups_0, pad = var_1786_pad_0, pad_type = var_1786_pad_type_0, strides = var_1786_strides_0, weight = layers_8_fc2_inlier_module_weight_to_fp16_palettized, x = input_71_cast_fp16)[name = tensor<string, []>("op_1786_cast_fp16")];`
1215	`tensor<string, []> var_1792_pad_type_0 = const()[name = tensor<string, []>("op_1792_pad_type_0"), val = tensor<string, []>("valid")];`
1216	`tensor<int32, [2]> var_1792_strides_0 = const()[name = tensor<string, []>("op_1792_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1217	`tensor<int32, [4]> var_1792_pad_0 = const()[name = tensor<string, []>("op_1792_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1218	`tensor<int32, [2]> var_1792_dilations_0 = const()[name = tensor<string, []>("op_1792_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1219	`tensor<int32, []> var_1792_groups_0 = const()[name = tensor<string, []>("op_1792_groups_0"), val = tensor<int32, []>(1)];`
1220	tensor<fp16, [768, 3072, 1, 1]> layers_8_fc2_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(48148992))), name = tensor<string, []>("layers_8_fc2_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [15247]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(48118400))), shape = tensor<uint32, [4]>([768, 3072, 1, 1])];
1221	`tensor<fp16, [1, 768, 1, 1500]> var_1792_cast_fp16 = conv(dilations = var_1792_dilations_0, groups = var_1792_groups_0, pad = var_1792_pad_0, pad_type = var_1792_pad_type_0, strides = var_1792_strides_0, weight = layers_8_fc2_outlier_module_weight_to_fp16_sparsified, x = input_71_cast_fp16)[name = tensor<string, []>("op_1792_cast_fp16")];`
1222	`tensor<fp16, [1, 768, 1, 1500]> hidden_states_21_cast_fp16 = add(x = var_1786_cast_fp16, y = var_1792_cast_fp16)[name = tensor<string, []>("hidden_states_21_cast_fp16")];`
1223	`tensor<fp16, [1, 768, 1, 1500]> inputs_37_cast_fp16 = add(x = inputs_35_cast_fp16, y = hidden_states_21_cast_fp16)[name = tensor<string, []>("inputs_37_cast_fp16")];`
1224	`tensor<int32, []> var_1798 = const()[name = tensor<string, []>("op_1798"), val = tensor<int32, []>(3)];`
1225	`tensor<int32, [1]> out_37_axes_0 = const()[name = tensor<string, []>("out_37_axes_0"), val = tensor<int32, [1]>([1])];`
1226	`tensor<fp16, []> var_1820_to_fp16 = const()[name = tensor<string, []>("op_1820_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
1227	`tensor<fp16, [1, 768, 1, 1500]> out_37_cast_fp16 = layer_norm(axes = out_37_axes_0, epsilon = var_1820_to_fp16, x = inputs_37_cast_fp16)[name = tensor<string, []>("out_37_cast_fp16")];`
1228	`tensor<fp16, [768]> obj_37_gamma_0_to_fp16 = const()[name = tensor<string, []>("obj_37_gamma_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(48443968)))];`
1229	`tensor<fp16, [768]> obj_37_beta_0_to_fp16 = const()[name = tensor<string, []>("obj_37_beta_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(48445568)))];`
1230	`tensor<fp16, []> obj_37_epsilon_0_to_fp16 = const()[name = tensor<string, []>("obj_37_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
1231	`tensor<fp16, [1, 768, 1, 1500]> obj_37_cast_fp16 = batch_norm(beta = obj_37_beta_0_to_fp16, epsilon = obj_37_epsilon_0_to_fp16, gamma = obj_37_gamma_0_to_fp16, mean = var_57_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_37_cast_fp16)[name = tensor<string, []>("obj_37_cast_fp16")];`
1232	`tensor<string, []> var_1842_pad_type_0 = const()[name = tensor<string, []>("op_1842_pad_type_0"), val = tensor<string, []>("valid")];`
1233	`tensor<int32, [2]> var_1842_strides_0 = const()[name = tensor<string, []>("op_1842_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1234	`tensor<int32, [4]> var_1842_pad_0 = const()[name = tensor<string, []>("op_1842_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1235	`tensor<int32, [2]> var_1842_dilations_0 = const()[name = tensor<string, []>("op_1842_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1236	`tensor<int32, []> var_1842_groups_0 = const()[name = tensor<string, []>("op_1842_groups_0"), val = tensor<int32, []>(1)];`
1237	tensor<fp16, [768, 768, 1, 1]> layers_9_self_attn_q_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(48447168))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(48742144))), name = tensor<string, []>("layers_9_self_attn_q_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
1238	`tensor<fp16, [768]> layers_9_self_attn_q_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_9_self_attn_q_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(48742272)))];`
1239	`tensor<fp16, [1, 768, 1, 1500]> var_1842_cast_fp16 = conv(bias = layers_9_self_attn_q_proj_inlier_module_bias_to_fp16, dilations = var_1842_dilations_0, groups = var_1842_groups_0, pad = var_1842_pad_0, pad_type = var_1842_pad_type_0, strides = var_1842_strides_0, weight = layers_9_self_attn_q_proj_inlier_module_weight_to_fp16_palettized, x = obj_37_cast_fp16)[name = tensor<string, []>("op_1842_cast_fp16")];`
1240	`tensor<string, []> var_1848_pad_type_0 = const()[name = tensor<string, []>("op_1848_pad_type_0"), val = tensor<string, []>("valid")];`
1241	`tensor<int32, [2]> var_1848_strides_0 = const()[name = tensor<string, []>("op_1848_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1242	`tensor<int32, [4]> var_1848_pad_0 = const()[name = tensor<string, []>("op_1848_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1243	`tensor<int32, [2]> var_1848_dilations_0 = const()[name = tensor<string, []>("op_1848_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1244	`tensor<int32, []> var_1848_groups_0 = const()[name = tensor<string, []>("op_1848_groups_0"), val = tensor<int32, []>(1)];`
1245	tensor<fp16, [768, 768, 1, 1]> layers_9_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(48750080))), name = tensor<string, []>("layers_9_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [3064]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(48743872))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
1246	`tensor<fp16, [1, 768, 1, 1500]> var_1848_cast_fp16 = conv(dilations = var_1848_dilations_0, groups = var_1848_groups_0, pad = var_1848_pad_0, pad_type = var_1848_pad_type_0, strides = var_1848_strides_0, weight = layers_9_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified, x = obj_37_cast_fp16)[name = tensor<string, []>("op_1848_cast_fp16")];`
1247	`tensor<fp16, [1, 768, 1, 1500]> query_19_cast_fp16 = add(x = var_1842_cast_fp16, y = var_1848_cast_fp16)[name = tensor<string, []>("query_19_cast_fp16")];`
1248	`tensor<string, []> var_1857_pad_type_0 = const()[name = tensor<string, []>("op_1857_pad_type_0"), val = tensor<string, []>("valid")];`
1249	`tensor<int32, [2]> var_1857_strides_0 = const()[name = tensor<string, []>("op_1857_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1250	`tensor<int32, [4]> var_1857_pad_0 = const()[name = tensor<string, []>("op_1857_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1251	`tensor<int32, [2]> var_1857_dilations_0 = const()[name = tensor<string, []>("op_1857_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1252	`tensor<int32, []> var_1857_groups_0 = const()[name = tensor<string, []>("op_1857_groups_0"), val = tensor<int32, []>(1)];`
1253	tensor<fp16, [768, 768, 1, 1]> layers_9_self_attn_k_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(48823872))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(49118848))), name = tensor<string, []>("layers_9_self_attn_k_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
1254	`tensor<fp16, [1, 768, 1, 1500]> var_1857_cast_fp16 = conv(dilations = var_1857_dilations_0, groups = var_1857_groups_0, pad = var_1857_pad_0, pad_type = var_1857_pad_type_0, strides = var_1857_strides_0, weight = layers_9_self_attn_k_proj_inlier_module_weight_to_fp16_palettized, x = obj_37_cast_fp16)[name = tensor<string, []>("op_1857_cast_fp16")];`
1255	`tensor<string, []> var_1863_pad_type_0 = const()[name = tensor<string, []>("op_1863_pad_type_0"), val = tensor<string, []>("valid")];`
1256	`tensor<int32, [2]> var_1863_strides_0 = const()[name = tensor<string, []>("op_1863_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1257	`tensor<int32, [4]> var_1863_pad_0 = const()[name = tensor<string, []>("op_1863_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1258	`tensor<int32, [2]> var_1863_dilations_0 = const()[name = tensor<string, []>("op_1863_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1259	`tensor<int32, []> var_1863_groups_0 = const()[name = tensor<string, []>("op_1863_groups_0"), val = tensor<int32, []>(1)];`
1260	tensor<fp16, [768, 768, 1, 1]> layers_9_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(49125760))), name = tensor<string, []>("layers_9_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [3358]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(49118976))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
1261	`tensor<fp16, [1, 768, 1, 1500]> var_1863_cast_fp16 = conv(dilations = var_1863_dilations_0, groups = var_1863_groups_0, pad = var_1863_pad_0, pad_type = var_1863_pad_type_0, strides = var_1863_strides_0, weight = layers_9_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified, x = obj_37_cast_fp16)[name = tensor<string, []>("op_1863_cast_fp16")];`
1262	`tensor<fp16, [1, 768, 1, 1500]> key_19_cast_fp16 = add(x = var_1857_cast_fp16, y = var_1863_cast_fp16)[name = tensor<string, []>("key_19_cast_fp16")];`
1263	`tensor<string, []> var_1873_pad_type_0 = const()[name = tensor<string, []>("op_1873_pad_type_0"), val = tensor<string, []>("valid")];`
1264	`tensor<int32, [2]> var_1873_strides_0 = const()[name = tensor<string, []>("op_1873_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1265	`tensor<int32, [4]> var_1873_pad_0 = const()[name = tensor<string, []>("op_1873_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1266	`tensor<int32, [2]> var_1873_dilations_0 = const()[name = tensor<string, []>("op_1873_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1267	`tensor<int32, []> var_1873_groups_0 = const()[name = tensor<string, []>("op_1873_groups_0"), val = tensor<int32, []>(1)];`
1268	tensor<fp16, [768, 768, 1, 1]> layers_9_self_attn_v_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(49199552))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(49494528))), name = tensor<string, []>("layers_9_self_attn_v_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
1269	`tensor<fp16, [768]> layers_9_self_attn_v_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_9_self_attn_v_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(49494656)))];`
1270	`tensor<fp16, [1, 768, 1, 1500]> var_1873_cast_fp16 = conv(bias = layers_9_self_attn_v_proj_inlier_module_bias_to_fp16, dilations = var_1873_dilations_0, groups = var_1873_groups_0, pad = var_1873_pad_0, pad_type = var_1873_pad_type_0, strides = var_1873_strides_0, weight = layers_9_self_attn_v_proj_inlier_module_weight_to_fp16_palettized, x = obj_37_cast_fp16)[name = tensor<string, []>("op_1873_cast_fp16")];`
1271	`tensor<string, []> var_1879_pad_type_0 = const()[name = tensor<string, []>("op_1879_pad_type_0"), val = tensor<string, []>("valid")];`
1272	`tensor<int32, [2]> var_1879_strides_0 = const()[name = tensor<string, []>("op_1879_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1273	`tensor<int32, [4]> var_1879_pad_0 = const()[name = tensor<string, []>("op_1879_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1274	`tensor<int32, [2]> var_1879_dilations_0 = const()[name = tensor<string, []>("op_1879_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1275	`tensor<int32, []> var_1879_groups_0 = const()[name = tensor<string, []>("op_1879_groups_0"), val = tensor<int32, []>(1)];`
1276	tensor<fp16, [768, 768, 1, 1]> layers_9_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(49501760))), name = tensor<string, []>("layers_9_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [2711]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(49496256))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
1277	`tensor<fp16, [1, 768, 1, 1500]> var_1879_cast_fp16 = conv(dilations = var_1879_dilations_0, groups = var_1879_groups_0, pad = var_1879_pad_0, pad_type = var_1879_pad_type_0, strides = var_1879_strides_0, weight = layers_9_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified, x = obj_37_cast_fp16)[name = tensor<string, []>("op_1879_cast_fp16")];`
1278	`tensor<fp16, [1, 768, 1, 1500]> value_19_cast_fp16 = add(x = var_1873_cast_fp16, y = var_1879_cast_fp16)[name = tensor<string, []>("value_19_cast_fp16")];`
1279	`tensor<int32, [4]> var_1883 = const()[name = tensor<string, []>("op_1883"), val = tensor<int32, [4]>([1, 12, 64, 1500])];`
1280	`tensor<fp16, [1, 12, 64, 1500]> mh_q_19_cast_fp16 = reshape(shape = var_1883, x = query_19_cast_fp16)[name = tensor<string, []>("mh_q_19_cast_fp16")];`
1281	`tensor<fp16, []> var_1885_to_fp16 = const()[name = tensor<string, []>("op_1885_to_fp16"), val = tensor<fp16, []>(0x1p-3)];`
1282	`tensor<fp16, [1, 12, 64, 1500]> var_1886_cast_fp16 = mul(x = mh_q_19_cast_fp16, y = var_1885_to_fp16)[name = tensor<string, []>("op_1886_cast_fp16")];`
1283	`tensor<int32, [4]> var_1889 = const()[name = tensor<string, []>("op_1889"), val = tensor<int32, [4]>([1, 12, 64, 1500])];`
1284	`tensor<fp16, [1, 12, 64, 1500]> var_1890_cast_fp16 = reshape(shape = var_1889, x = key_19_cast_fp16)[name = tensor<string, []>("op_1890_cast_fp16")];`
1285	`tensor<bool, []> mh_w_19_transpose_x_0 = const()[name = tensor<string, []>("mh_w_19_transpose_x_0"), val = tensor<bool, []>(true)];`
1286	`tensor<bool, []> mh_w_19_transpose_y_0 = const()[name = tensor<string, []>("mh_w_19_transpose_y_0"), val = tensor<bool, []>(false)];`
1287	`tensor<fp16, [1, 12, 1500, 1500]> mh_w_19_cast_fp16 = matmul(transpose_x = mh_w_19_transpose_x_0, transpose_y = mh_w_19_transpose_y_0, x = var_1886_cast_fp16, y = var_1890_cast_fp16)[name = tensor<string, []>("mh_w_19_cast_fp16")];`
1288	`tensor<fp16, [1, 12, 1500, 1500]> var_1893_cast_fp16 = softmax(axis = var_1798, x = mh_w_19_cast_fp16)[name = tensor<string, []>("op_1893_cast_fp16")];`
1289	`tensor<int32, [4]> var_1894 = const()[name = tensor<string, []>("op_1894"), val = tensor<int32, [4]>([1, 12, 64, 1500])];`
1290	`tensor<fp16, [1, 12, 64, 1500]> var_1895_cast_fp16 = reshape(shape = var_1894, x = value_19_cast_fp16)[name = tensor<string, []>("op_1895_cast_fp16")];`
1291	`tensor<bool, []> attn_19_transpose_x_0 = const()[name = tensor<string, []>("attn_19_transpose_x_0"), val = tensor<bool, []>(false)];`
1292	`tensor<bool, []> attn_19_transpose_y_0 = const()[name = tensor<string, []>("attn_19_transpose_y_0"), val = tensor<bool, []>(true)];`
1293	`tensor<fp16, [1, 12, 64, 1500]> attn_19_cast_fp16 = matmul(transpose_x = attn_19_transpose_x_0, transpose_y = attn_19_transpose_y_0, x = var_1895_cast_fp16, y = var_1893_cast_fp16)[name = tensor<string, []>("attn_19_cast_fp16")];`
1294	`tensor<int32, [4]> var_1898 = const()[name = tensor<string, []>("op_1898"), val = tensor<int32, [4]>([1, 768, 1, 1500])];`
1295	`tensor<fp16, [1, 768, 1, 1500]> input_73_cast_fp16 = reshape(shape = var_1898, x = attn_19_cast_fp16)[name = tensor<string, []>("input_73_cast_fp16")];`
1296	`tensor<string, []> var_1908_pad_type_0 = const()[name = tensor<string, []>("op_1908_pad_type_0"), val = tensor<string, []>("valid")];`
1297	`tensor<int32, [2]> var_1908_strides_0 = const()[name = tensor<string, []>("op_1908_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1298	`tensor<int32, [4]> var_1908_pad_0 = const()[name = tensor<string, []>("op_1908_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1299	`tensor<int32, [2]> var_1908_dilations_0 = const()[name = tensor<string, []>("op_1908_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1300	`tensor<int32, []> var_1908_groups_0 = const()[name = tensor<string, []>("op_1908_groups_0"), val = tensor<int32, []>(1)];`
1301	tensor<fp16, [768, 768, 1, 1]> layers_9_self_attn_o_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(49575552))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(49870528))), name = tensor<string, []>("layers_9_self_attn_o_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
1302	`tensor<fp16, [768]> layers_9_self_attn_o_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_9_self_attn_o_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(49870656)))];`
1303	`tensor<fp16, [1, 768, 1, 1500]> var_1908_cast_fp16 = conv(bias = layers_9_self_attn_o_proj_inlier_module_bias_to_fp16, dilations = var_1908_dilations_0, groups = var_1908_groups_0, pad = var_1908_pad_0, pad_type = var_1908_pad_type_0, strides = var_1908_strides_0, weight = layers_9_self_attn_o_proj_inlier_module_weight_to_fp16_palettized, x = input_73_cast_fp16)[name = tensor<string, []>("op_1908_cast_fp16")];`
1304	`tensor<string, []> var_1914_pad_type_0 = const()[name = tensor<string, []>("op_1914_pad_type_0"), val = tensor<string, []>("valid")];`
1305	`tensor<int32, [2]> var_1914_strides_0 = const()[name = tensor<string, []>("op_1914_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1306	`tensor<int32, [4]> var_1914_pad_0 = const()[name = tensor<string, []>("op_1914_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1307	`tensor<int32, [2]> var_1914_dilations_0 = const()[name = tensor<string, []>("op_1914_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1308	`tensor<int32, []> var_1914_groups_0 = const()[name = tensor<string, []>("op_1914_groups_0"), val = tensor<int32, []>(1)];`
1309	tensor<fp16, [768, 768, 1, 1]> layers_9_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(49877760))), name = tensor<string, []>("layers_9_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [2712]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(49872256))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
1310	`tensor<fp16, [1, 768, 1, 1500]> var_1914_cast_fp16 = conv(dilations = var_1914_dilations_0, groups = var_1914_groups_0, pad = var_1914_pad_0, pad_type = var_1914_pad_type_0, strides = var_1914_strides_0, weight = layers_9_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified, x = input_73_cast_fp16)[name = tensor<string, []>("op_1914_cast_fp16")];`
1311	`tensor<fp16, [1, 768, 1, 1500]> obj_39_cast_fp16 = add(x = var_1908_cast_fp16, y = var_1914_cast_fp16)[name = tensor<string, []>("obj_39_cast_fp16")];`
1312	`tensor<fp16, [1, 768, 1, 1500]> inputs_39_cast_fp16 = add(x = inputs_37_cast_fp16, y = obj_39_cast_fp16)[name = tensor<string, []>("inputs_39_cast_fp16")];`
1313	`tensor<int32, [1]> out_39_axes_0 = const()[name = tensor<string, []>("out_39_axes_0"), val = tensor<int32, [1]>([1])];`
1314	`tensor<fp16, []> var_1925_to_fp16 = const()[name = tensor<string, []>("op_1925_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
1315	`tensor<fp16, [1, 768, 1, 1500]> out_39_cast_fp16 = layer_norm(axes = out_39_axes_0, epsilon = var_1925_to_fp16, x = inputs_39_cast_fp16)[name = tensor<string, []>("out_39_cast_fp16")];`
1316	`tensor<fp16, [768]> input_75_gamma_0_to_fp16 = const()[name = tensor<string, []>("input_75_gamma_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(49951552)))];`
1317	`tensor<fp16, [768]> input_75_beta_0_to_fp16 = const()[name = tensor<string, []>("input_75_beta_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(49953152)))];`
1318	`tensor<fp16, []> input_75_epsilon_0_to_fp16 = const()[name = tensor<string, []>("input_75_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
1319	`tensor<fp16, [1, 768, 1, 1500]> input_75_cast_fp16 = batch_norm(beta = input_75_beta_0_to_fp16, epsilon = input_75_epsilon_0_to_fp16, gamma = input_75_gamma_0_to_fp16, mean = var_57_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_39_cast_fp16)[name = tensor<string, []>("input_75_cast_fp16")];`
1320	`tensor<string, []> var_1943_pad_type_0 = const()[name = tensor<string, []>("op_1943_pad_type_0"), val = tensor<string, []>("valid")];`
1321	`tensor<int32, [2]> var_1943_strides_0 = const()[name = tensor<string, []>("op_1943_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1322	`tensor<int32, [4]> var_1943_pad_0 = const()[name = tensor<string, []>("op_1943_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1323	`tensor<int32, [2]> var_1943_dilations_0 = const()[name = tensor<string, []>("op_1943_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1324	`tensor<int32, []> var_1943_groups_0 = const()[name = tensor<string, []>("op_1943_groups_0"), val = tensor<int32, []>(1)];`
1325	tensor<fp16, [3072, 768, 1, 1]> layers_9_fc1_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [1179648]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(49954752))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(51134464))), name = tensor<string, []>("layers_9_fc1_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([3072, 768, 1, 1])];
1326	`tensor<fp16, [3072]> layers_9_fc1_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_9_fc1_inlier_module_bias_to_fp16"), val = tensor<fp16, [3072]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(51134592)))];`
1327	`tensor<fp16, [1, 3072, 1, 1500]> var_1943_cast_fp16 = conv(bias = layers_9_fc1_inlier_module_bias_to_fp16, dilations = var_1943_dilations_0, groups = var_1943_groups_0, pad = var_1943_pad_0, pad_type = var_1943_pad_type_0, strides = var_1943_strides_0, weight = layers_9_fc1_inlier_module_weight_to_fp16_palettized, x = input_75_cast_fp16)[name = tensor<string, []>("op_1943_cast_fp16")];`
1328	`tensor<string, []> var_1949_pad_type_0 = const()[name = tensor<string, []>("op_1949_pad_type_0"), val = tensor<string, []>("valid")];`
1329	`tensor<int32, [2]> var_1949_strides_0 = const()[name = tensor<string, []>("op_1949_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1330	`tensor<int32, [4]> var_1949_pad_0 = const()[name = tensor<string, []>("op_1949_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1331	`tensor<int32, [2]> var_1949_dilations_0 = const()[name = tensor<string, []>("op_1949_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1332	`tensor<int32, []> var_1949_groups_0 = const()[name = tensor<string, []>("op_1949_groups_0"), val = tensor<int32, []>(1)];`
1333	tensor<fp16, [3072, 768, 1, 1]> layers_9_fc1_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(51171648))), name = tensor<string, []>("layers_9_fc1_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [15382]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(51140800))), shape = tensor<uint32, [4]>([3072, 768, 1, 1])];
1334	`tensor<fp16, [1, 3072, 1, 1500]> var_1949_cast_fp16 = conv(dilations = var_1949_dilations_0, groups = var_1949_groups_0, pad = var_1949_pad_0, pad_type = var_1949_pad_type_0, strides = var_1949_strides_0, weight = layers_9_fc1_outlier_module_weight_to_fp16_sparsified, x = input_75_cast_fp16)[name = tensor<string, []>("op_1949_cast_fp16")];`
1335	`tensor<fp16, [1, 3072, 1, 1500]> input_77_cast_fp16 = add(x = var_1943_cast_fp16, y = var_1949_cast_fp16)[name = tensor<string, []>("input_77_cast_fp16")];`
1336	`tensor<string, []> input_79_mode_0 = const()[name = tensor<string, []>("input_79_mode_0"), val = tensor<string, []>("EXACT")];`
1337	`tensor<fp16, [1, 3072, 1, 1500]> input_79_cast_fp16 = gelu(mode = input_79_mode_0, x = input_77_cast_fp16)[name = tensor<string, []>("input_79_cast_fp16")];`
1338	`tensor<string, []> var_1960_pad_type_0 = const()[name = tensor<string, []>("op_1960_pad_type_0"), val = tensor<string, []>("valid")];`
1339	`tensor<int32, [2]> var_1960_strides_0 = const()[name = tensor<string, []>("op_1960_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1340	`tensor<int32, [4]> var_1960_pad_0 = const()[name = tensor<string, []>("op_1960_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1341	`tensor<int32, [2]> var_1960_dilations_0 = const()[name = tensor<string, []>("op_1960_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1342	`tensor<int32, []> var_1960_groups_0 = const()[name = tensor<string, []>("op_1960_groups_0"), val = tensor<int32, []>(1)];`
1343	tensor<fp16, [768, 3072, 1, 1]> layers_9_fc2_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [1179648]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(51466624))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(52646336))), name = tensor<string, []>("layers_9_fc2_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 3072, 1, 1])];
1344	`tensor<fp16, [768]> layers_9_fc2_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_9_fc2_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(52646464)))];`
1345	`tensor<fp16, [1, 768, 1, 1500]> var_1960_cast_fp16 = conv(bias = layers_9_fc2_inlier_module_bias_to_fp16, dilations = var_1960_dilations_0, groups = var_1960_groups_0, pad = var_1960_pad_0, pad_type = var_1960_pad_type_0, strides = var_1960_strides_0, weight = layers_9_fc2_inlier_module_weight_to_fp16_palettized, x = input_79_cast_fp16)[name = tensor<string, []>("op_1960_cast_fp16")];`
1346	`tensor<string, []> var_1966_pad_type_0 = const()[name = tensor<string, []>("op_1966_pad_type_0"), val = tensor<string, []>("valid")];`
1347	`tensor<int32, [2]> var_1966_strides_0 = const()[name = tensor<string, []>("op_1966_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1348	`tensor<int32, [4]> var_1966_pad_0 = const()[name = tensor<string, []>("op_1966_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1349	`tensor<int32, [2]> var_1966_dilations_0 = const()[name = tensor<string, []>("op_1966_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1350	`tensor<int32, []> var_1966_groups_0 = const()[name = tensor<string, []>("op_1966_groups_0"), val = tensor<int32, []>(1)];`
1351	tensor<fp16, [768, 3072, 1, 1]> layers_9_fc2_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(52680576))), name = tensor<string, []>("layers_9_fc2_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [16208]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(52648064))), shape = tensor<uint32, [4]>([768, 3072, 1, 1])];
1352	`tensor<fp16, [1, 768, 1, 1500]> var_1966_cast_fp16 = conv(dilations = var_1966_dilations_0, groups = var_1966_groups_0, pad = var_1966_pad_0, pad_type = var_1966_pad_type_0, strides = var_1966_strides_0, weight = layers_9_fc2_outlier_module_weight_to_fp16_sparsified, x = input_79_cast_fp16)[name = tensor<string, []>("op_1966_cast_fp16")];`
1353	`tensor<fp16, [1, 768, 1, 1500]> hidden_states_23_cast_fp16 = add(x = var_1960_cast_fp16, y = var_1966_cast_fp16)[name = tensor<string, []>("hidden_states_23_cast_fp16")];`
1354	`tensor<fp16, [1, 768, 1, 1500]> inputs_41_cast_fp16 = add(x = inputs_39_cast_fp16, y = hidden_states_23_cast_fp16)[name = tensor<string, []>("inputs_41_cast_fp16")];`
1355	`tensor<int32, []> var_1972 = const()[name = tensor<string, []>("op_1972"), val = tensor<int32, []>(3)];`
1356	`tensor<int32, [1]> out_41_axes_0 = const()[name = tensor<string, []>("out_41_axes_0"), val = tensor<int32, [1]>([1])];`
1357	`tensor<fp16, []> var_1994_to_fp16 = const()[name = tensor<string, []>("op_1994_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
1358	`tensor<fp16, [1, 768, 1, 1500]> out_41_cast_fp16 = layer_norm(axes = out_41_axes_0, epsilon = var_1994_to_fp16, x = inputs_41_cast_fp16)[name = tensor<string, []>("out_41_cast_fp16")];`
1359	`tensor<fp16, [768]> obj_41_gamma_0_to_fp16 = const()[name = tensor<string, []>("obj_41_gamma_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(52975552)))];`
1360	`tensor<fp16, [768]> obj_41_beta_0_to_fp16 = const()[name = tensor<string, []>("obj_41_beta_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(52977152)))];`
1361	`tensor<fp16, []> obj_41_epsilon_0_to_fp16 = const()[name = tensor<string, []>("obj_41_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
1362	`tensor<fp16, [1, 768, 1, 1500]> obj_41_cast_fp16 = batch_norm(beta = obj_41_beta_0_to_fp16, epsilon = obj_41_epsilon_0_to_fp16, gamma = obj_41_gamma_0_to_fp16, mean = var_57_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_41_cast_fp16)[name = tensor<string, []>("obj_41_cast_fp16")];`
1363	`tensor<string, []> var_2016_pad_type_0 = const()[name = tensor<string, []>("op_2016_pad_type_0"), val = tensor<string, []>("valid")];`
1364	`tensor<int32, [2]> var_2016_strides_0 = const()[name = tensor<string, []>("op_2016_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1365	`tensor<int32, [4]> var_2016_pad_0 = const()[name = tensor<string, []>("op_2016_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1366	`tensor<int32, [2]> var_2016_dilations_0 = const()[name = tensor<string, []>("op_2016_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1367	`tensor<int32, []> var_2016_groups_0 = const()[name = tensor<string, []>("op_2016_groups_0"), val = tensor<int32, []>(1)];`
1368	tensor<fp16, [768, 768, 1, 1]> layers_10_self_attn_q_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(52978752))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(53273728))), name = tensor<string, []>("layers_10_self_attn_q_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
1369	`tensor<fp16, [768]> layers_10_self_attn_q_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_10_self_attn_q_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(53273856)))];`
1370	`tensor<fp16, [1, 768, 1, 1500]> var_2016_cast_fp16 = conv(bias = layers_10_self_attn_q_proj_inlier_module_bias_to_fp16, dilations = var_2016_dilations_0, groups = var_2016_groups_0, pad = var_2016_pad_0, pad_type = var_2016_pad_type_0, strides = var_2016_strides_0, weight = layers_10_self_attn_q_proj_inlier_module_weight_to_fp16_palettized, x = obj_41_cast_fp16)[name = tensor<string, []>("op_2016_cast_fp16")];`
1371	`tensor<string, []> var_2022_pad_type_0 = const()[name = tensor<string, []>("op_2022_pad_type_0"), val = tensor<string, []>("valid")];`
1372	`tensor<int32, [2]> var_2022_strides_0 = const()[name = tensor<string, []>("op_2022_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1373	`tensor<int32, [4]> var_2022_pad_0 = const()[name = tensor<string, []>("op_2022_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1374	`tensor<int32, [2]> var_2022_dilations_0 = const()[name = tensor<string, []>("op_2022_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1375	`tensor<int32, []> var_2022_groups_0 = const()[name = tensor<string, []>("op_2022_groups_0"), val = tensor<int32, []>(1)];`
1376	tensor<fp16, [768, 768, 1, 1]> layers_10_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(53281536))), name = tensor<string, []>("layers_10_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [3007]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(53275456))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
1377	`tensor<fp16, [1, 768, 1, 1500]> var_2022_cast_fp16 = conv(dilations = var_2022_dilations_0, groups = var_2022_groups_0, pad = var_2022_pad_0, pad_type = var_2022_pad_type_0, strides = var_2022_strides_0, weight = layers_10_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified, x = obj_41_cast_fp16)[name = tensor<string, []>("op_2022_cast_fp16")];`
1378	`tensor<fp16, [1, 768, 1, 1500]> query_21_cast_fp16 = add(x = var_2016_cast_fp16, y = var_2022_cast_fp16)[name = tensor<string, []>("query_21_cast_fp16")];`
1379	`tensor<string, []> var_2031_pad_type_0 = const()[name = tensor<string, []>("op_2031_pad_type_0"), val = tensor<string, []>("valid")];`
1380	`tensor<int32, [2]> var_2031_strides_0 = const()[name = tensor<string, []>("op_2031_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1381	`tensor<int32, [4]> var_2031_pad_0 = const()[name = tensor<string, []>("op_2031_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1382	`tensor<int32, [2]> var_2031_dilations_0 = const()[name = tensor<string, []>("op_2031_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1383	`tensor<int32, []> var_2031_groups_0 = const()[name = tensor<string, []>("op_2031_groups_0"), val = tensor<int32, []>(1)];`
1384	tensor<fp16, [768, 768, 1, 1]> layers_10_self_attn_k_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(53355328))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(53650304))), name = tensor<string, []>("layers_10_self_attn_k_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
1385	`tensor<fp16, [1, 768, 1, 1500]> var_2031_cast_fp16 = conv(dilations = var_2031_dilations_0, groups = var_2031_groups_0, pad = var_2031_pad_0, pad_type = var_2031_pad_type_0, strides = var_2031_strides_0, weight = layers_10_self_attn_k_proj_inlier_module_weight_to_fp16_palettized, x = obj_41_cast_fp16)[name = tensor<string, []>("op_2031_cast_fp16")];`
1386	`tensor<string, []> var_2037_pad_type_0 = const()[name = tensor<string, []>("op_2037_pad_type_0"), val = tensor<string, []>("valid")];`
1387	`tensor<int32, [2]> var_2037_strides_0 = const()[name = tensor<string, []>("op_2037_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1388	`tensor<int32, [4]> var_2037_pad_0 = const()[name = tensor<string, []>("op_2037_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1389	`tensor<int32, [2]> var_2037_dilations_0 = const()[name = tensor<string, []>("op_2037_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1390	`tensor<int32, []> var_2037_groups_0 = const()[name = tensor<string, []>("op_2037_groups_0"), val = tensor<int32, []>(1)];`
1391	tensor<fp16, [768, 768, 1, 1]> layers_10_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(53657216))), name = tensor<string, []>("layers_10_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [3358]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(53650432))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
1392	`tensor<fp16, [1, 768, 1, 1500]> var_2037_cast_fp16 = conv(dilations = var_2037_dilations_0, groups = var_2037_groups_0, pad = var_2037_pad_0, pad_type = var_2037_pad_type_0, strides = var_2037_strides_0, weight = layers_10_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified, x = obj_41_cast_fp16)[name = tensor<string, []>("op_2037_cast_fp16")];`
1393	`tensor<fp16, [1, 768, 1, 1500]> key_21_cast_fp16 = add(x = var_2031_cast_fp16, y = var_2037_cast_fp16)[name = tensor<string, []>("key_21_cast_fp16")];`
1394	`tensor<string, []> var_2047_pad_type_0 = const()[name = tensor<string, []>("op_2047_pad_type_0"), val = tensor<string, []>("valid")];`
1395	`tensor<int32, [2]> var_2047_strides_0 = const()[name = tensor<string, []>("op_2047_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1396	`tensor<int32, [4]> var_2047_pad_0 = const()[name = tensor<string, []>("op_2047_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1397	`tensor<int32, [2]> var_2047_dilations_0 = const()[name = tensor<string, []>("op_2047_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1398	`tensor<int32, []> var_2047_groups_0 = const()[name = tensor<string, []>("op_2047_groups_0"), val = tensor<int32, []>(1)];`
1399	tensor<fp16, [768, 768, 1, 1]> layers_10_self_attn_v_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(53731008))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(54025984))), name = tensor<string, []>("layers_10_self_attn_v_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
1400	`tensor<fp16, [768]> layers_10_self_attn_v_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_10_self_attn_v_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(54026112)))];`
1401	`tensor<fp16, [1, 768, 1, 1500]> var_2047_cast_fp16 = conv(bias = layers_10_self_attn_v_proj_inlier_module_bias_to_fp16, dilations = var_2047_dilations_0, groups = var_2047_groups_0, pad = var_2047_pad_0, pad_type = var_2047_pad_type_0, strides = var_2047_strides_0, weight = layers_10_self_attn_v_proj_inlier_module_weight_to_fp16_palettized, x = obj_41_cast_fp16)[name = tensor<string, []>("op_2047_cast_fp16")];`
1402	`tensor<string, []> var_2053_pad_type_0 = const()[name = tensor<string, []>("op_2053_pad_type_0"), val = tensor<string, []>("valid")];`
1403	`tensor<int32, [2]> var_2053_strides_0 = const()[name = tensor<string, []>("op_2053_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1404	`tensor<int32, [4]> var_2053_pad_0 = const()[name = tensor<string, []>("op_2053_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1405	`tensor<int32, [2]> var_2053_dilations_0 = const()[name = tensor<string, []>("op_2053_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1406	`tensor<int32, []> var_2053_groups_0 = const()[name = tensor<string, []>("op_2053_groups_0"), val = tensor<int32, []>(1)];`
1407	tensor<fp16, [768, 768, 1, 1]> layers_10_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(54033152))), name = tensor<string, []>("layers_10_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [2685]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(54027712))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
1408	`tensor<fp16, [1, 768, 1, 1500]> var_2053_cast_fp16 = conv(dilations = var_2053_dilations_0, groups = var_2053_groups_0, pad = var_2053_pad_0, pad_type = var_2053_pad_type_0, strides = var_2053_strides_0, weight = layers_10_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified, x = obj_41_cast_fp16)[name = tensor<string, []>("op_2053_cast_fp16")];`
1409	`tensor<fp16, [1, 768, 1, 1500]> value_21_cast_fp16 = add(x = var_2047_cast_fp16, y = var_2053_cast_fp16)[name = tensor<string, []>("value_21_cast_fp16")];`
1410	`tensor<int32, [4]> var_2057 = const()[name = tensor<string, []>("op_2057"), val = tensor<int32, [4]>([1, 12, 64, 1500])];`
1411	`tensor<fp16, [1, 12, 64, 1500]> mh_q_21_cast_fp16 = reshape(shape = var_2057, x = query_21_cast_fp16)[name = tensor<string, []>("mh_q_21_cast_fp16")];`
1412	`tensor<fp16, []> var_2059_to_fp16 = const()[name = tensor<string, []>("op_2059_to_fp16"), val = tensor<fp16, []>(0x1p-3)];`
1413	`tensor<fp16, [1, 12, 64, 1500]> var_2060_cast_fp16 = mul(x = mh_q_21_cast_fp16, y = var_2059_to_fp16)[name = tensor<string, []>("op_2060_cast_fp16")];`
1414	`tensor<int32, [4]> var_2063 = const()[name = tensor<string, []>("op_2063"), val = tensor<int32, [4]>([1, 12, 64, 1500])];`
1415	`tensor<fp16, [1, 12, 64, 1500]> var_2064_cast_fp16 = reshape(shape = var_2063, x = key_21_cast_fp16)[name = tensor<string, []>("op_2064_cast_fp16")];`
1416	`tensor<bool, []> mh_w_21_transpose_x_0 = const()[name = tensor<string, []>("mh_w_21_transpose_x_0"), val = tensor<bool, []>(true)];`
1417	`tensor<bool, []> mh_w_21_transpose_y_0 = const()[name = tensor<string, []>("mh_w_21_transpose_y_0"), val = tensor<bool, []>(false)];`
1418	`tensor<fp16, [1, 12, 1500, 1500]> mh_w_21_cast_fp16 = matmul(transpose_x = mh_w_21_transpose_x_0, transpose_y = mh_w_21_transpose_y_0, x = var_2060_cast_fp16, y = var_2064_cast_fp16)[name = tensor<string, []>("mh_w_21_cast_fp16")];`
1419	`tensor<fp16, [1, 12, 1500, 1500]> var_2067_cast_fp16 = softmax(axis = var_1972, x = mh_w_21_cast_fp16)[name = tensor<string, []>("op_2067_cast_fp16")];`
1420	`tensor<int32, [4]> var_2068 = const()[name = tensor<string, []>("op_2068"), val = tensor<int32, [4]>([1, 12, 64, 1500])];`
1421	`tensor<fp16, [1, 12, 64, 1500]> var_2069_cast_fp16 = reshape(shape = var_2068, x = value_21_cast_fp16)[name = tensor<string, []>("op_2069_cast_fp16")];`
1422	`tensor<bool, []> attn_21_transpose_x_0 = const()[name = tensor<string, []>("attn_21_transpose_x_0"), val = tensor<bool, []>(false)];`
1423	`tensor<bool, []> attn_21_transpose_y_0 = const()[name = tensor<string, []>("attn_21_transpose_y_0"), val = tensor<bool, []>(true)];`
1424	`tensor<fp16, [1, 12, 64, 1500]> attn_21_cast_fp16 = matmul(transpose_x = attn_21_transpose_x_0, transpose_y = attn_21_transpose_y_0, x = var_2069_cast_fp16, y = var_2067_cast_fp16)[name = tensor<string, []>("attn_21_cast_fp16")];`
1425	`tensor<int32, [4]> var_2072 = const()[name = tensor<string, []>("op_2072"), val = tensor<int32, [4]>([1, 768, 1, 1500])];`
1426	`tensor<fp16, [1, 768, 1, 1500]> input_81_cast_fp16 = reshape(shape = var_2072, x = attn_21_cast_fp16)[name = tensor<string, []>("input_81_cast_fp16")];`
1427	`tensor<string, []> var_2082_pad_type_0 = const()[name = tensor<string, []>("op_2082_pad_type_0"), val = tensor<string, []>("valid")];`
1428	`tensor<int32, [2]> var_2082_strides_0 = const()[name = tensor<string, []>("op_2082_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1429	`tensor<int32, [4]> var_2082_pad_0 = const()[name = tensor<string, []>("op_2082_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1430	`tensor<int32, [2]> var_2082_dilations_0 = const()[name = tensor<string, []>("op_2082_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1431	`tensor<int32, []> var_2082_groups_0 = const()[name = tensor<string, []>("op_2082_groups_0"), val = tensor<int32, []>(1)];`
1432	tensor<fp16, [768, 768, 1, 1]> layers_10_self_attn_o_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(54106944))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(54401920))), name = tensor<string, []>("layers_10_self_attn_o_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
1433	`tensor<fp16, [768]> layers_10_self_attn_o_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_10_self_attn_o_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(54402048)))];`
1434	`tensor<fp16, [1, 768, 1, 1500]> var_2082_cast_fp16 = conv(bias = layers_10_self_attn_o_proj_inlier_module_bias_to_fp16, dilations = var_2082_dilations_0, groups = var_2082_groups_0, pad = var_2082_pad_0, pad_type = var_2082_pad_type_0, strides = var_2082_strides_0, weight = layers_10_self_attn_o_proj_inlier_module_weight_to_fp16_palettized, x = input_81_cast_fp16)[name = tensor<string, []>("op_2082_cast_fp16")];`
1435	`tensor<string, []> var_2088_pad_type_0 = const()[name = tensor<string, []>("op_2088_pad_type_0"), val = tensor<string, []>("valid")];`
1436	`tensor<int32, [2]> var_2088_strides_0 = const()[name = tensor<string, []>("op_2088_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1437	`tensor<int32, [4]> var_2088_pad_0 = const()[name = tensor<string, []>("op_2088_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1438	`tensor<int32, [2]> var_2088_dilations_0 = const()[name = tensor<string, []>("op_2088_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1439	`tensor<int32, []> var_2088_groups_0 = const()[name = tensor<string, []>("op_2088_groups_0"), val = tensor<int32, []>(1)];`
1440	tensor<fp16, [768, 768, 1, 1]> layers_10_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(54409472))), name = tensor<string, []>("layers_10_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [2866]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(54403648))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
1441	`tensor<fp16, [1, 768, 1, 1500]> var_2088_cast_fp16 = conv(dilations = var_2088_dilations_0, groups = var_2088_groups_0, pad = var_2088_pad_0, pad_type = var_2088_pad_type_0, strides = var_2088_strides_0, weight = layers_10_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified, x = input_81_cast_fp16)[name = tensor<string, []>("op_2088_cast_fp16")];`
1442	`tensor<fp16, [1, 768, 1, 1500]> obj_43_cast_fp16 = add(x = var_2082_cast_fp16, y = var_2088_cast_fp16)[name = tensor<string, []>("obj_43_cast_fp16")];`
1443	`tensor<fp16, [1, 768, 1, 1500]> inputs_43_cast_fp16 = add(x = inputs_41_cast_fp16, y = obj_43_cast_fp16)[name = tensor<string, []>("inputs_43_cast_fp16")];`
1444	`tensor<int32, [1]> out_43_axes_0 = const()[name = tensor<string, []>("out_43_axes_0"), val = tensor<int32, [1]>([1])];`
1445	`tensor<fp16, []> var_2099_to_fp16 = const()[name = tensor<string, []>("op_2099_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
1446	`tensor<fp16, [1, 768, 1, 1500]> out_43_cast_fp16 = layer_norm(axes = out_43_axes_0, epsilon = var_2099_to_fp16, x = inputs_43_cast_fp16)[name = tensor<string, []>("out_43_cast_fp16")];`
1447	`tensor<fp16, [768]> input_83_gamma_0_to_fp16 = const()[name = tensor<string, []>("input_83_gamma_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(54483264)))];`
1448	`tensor<fp16, [768]> input_83_beta_0_to_fp16 = const()[name = tensor<string, []>("input_83_beta_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(54484864)))];`
1449	`tensor<fp16, []> input_83_epsilon_0_to_fp16 = const()[name = tensor<string, []>("input_83_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
1450	`tensor<fp16, [1, 768, 1, 1500]> input_83_cast_fp16 = batch_norm(beta = input_83_beta_0_to_fp16, epsilon = input_83_epsilon_0_to_fp16, gamma = input_83_gamma_0_to_fp16, mean = var_57_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_43_cast_fp16)[name = tensor<string, []>("input_83_cast_fp16")];`
1451	`tensor<string, []> var_2117_pad_type_0 = const()[name = tensor<string, []>("op_2117_pad_type_0"), val = tensor<string, []>("valid")];`
1452	`tensor<int32, [2]> var_2117_strides_0 = const()[name = tensor<string, []>("op_2117_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1453	`tensor<int32, [4]> var_2117_pad_0 = const()[name = tensor<string, []>("op_2117_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1454	`tensor<int32, [2]> var_2117_dilations_0 = const()[name = tensor<string, []>("op_2117_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1455	`tensor<int32, []> var_2117_groups_0 = const()[name = tensor<string, []>("op_2117_groups_0"), val = tensor<int32, []>(1)];`
1456	tensor<fp16, [3072, 768, 1, 1]> layers_10_fc1_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [1179648]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(54486464))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(55666176))), name = tensor<string, []>("layers_10_fc1_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([3072, 768, 1, 1])];
1457	`tensor<fp16, [3072]> layers_10_fc1_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_10_fc1_inlier_module_bias_to_fp16"), val = tensor<fp16, [3072]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(55666304)))];`
1458	`tensor<fp16, [1, 3072, 1, 1500]> var_2117_cast_fp16 = conv(bias = layers_10_fc1_inlier_module_bias_to_fp16, dilations = var_2117_dilations_0, groups = var_2117_groups_0, pad = var_2117_pad_0, pad_type = var_2117_pad_type_0, strides = var_2117_strides_0, weight = layers_10_fc1_inlier_module_weight_to_fp16_palettized, x = input_83_cast_fp16)[name = tensor<string, []>("op_2117_cast_fp16")];`
1459	`tensor<string, []> var_2123_pad_type_0 = const()[name = tensor<string, []>("op_2123_pad_type_0"), val = tensor<string, []>("valid")];`
1460	`tensor<int32, [2]> var_2123_strides_0 = const()[name = tensor<string, []>("op_2123_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1461	`tensor<int32, [4]> var_2123_pad_0 = const()[name = tensor<string, []>("op_2123_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1462	`tensor<int32, [2]> var_2123_dilations_0 = const()[name = tensor<string, []>("op_2123_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1463	`tensor<int32, []> var_2123_groups_0 = const()[name = tensor<string, []>("op_2123_groups_0"), val = tensor<int32, []>(1)];`
1464	tensor<fp16, [3072, 768, 1, 1]> layers_10_fc1_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(55704320))), name = tensor<string, []>("layers_10_fc1_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [15858]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(55672512))), shape = tensor<uint32, [4]>([3072, 768, 1, 1])];
1465	`tensor<fp16, [1, 3072, 1, 1500]> var_2123_cast_fp16 = conv(dilations = var_2123_dilations_0, groups = var_2123_groups_0, pad = var_2123_pad_0, pad_type = var_2123_pad_type_0, strides = var_2123_strides_0, weight = layers_10_fc1_outlier_module_weight_to_fp16_sparsified, x = input_83_cast_fp16)[name = tensor<string, []>("op_2123_cast_fp16")];`
1466	`tensor<fp16, [1, 3072, 1, 1500]> input_85_cast_fp16 = add(x = var_2117_cast_fp16, y = var_2123_cast_fp16)[name = tensor<string, []>("input_85_cast_fp16")];`
1467	`tensor<string, []> input_87_mode_0 = const()[name = tensor<string, []>("input_87_mode_0"), val = tensor<string, []>("EXACT")];`
1468	`tensor<fp16, [1, 3072, 1, 1500]> input_87_cast_fp16 = gelu(mode = input_87_mode_0, x = input_85_cast_fp16)[name = tensor<string, []>("input_87_cast_fp16")];`
1469	`tensor<string, []> var_2134_pad_type_0 = const()[name = tensor<string, []>("op_2134_pad_type_0"), val = tensor<string, []>("valid")];`
1470	`tensor<int32, [2]> var_2134_strides_0 = const()[name = tensor<string, []>("op_2134_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1471	`tensor<int32, [4]> var_2134_pad_0 = const()[name = tensor<string, []>("op_2134_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1472	`tensor<int32, [2]> var_2134_dilations_0 = const()[name = tensor<string, []>("op_2134_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1473	`tensor<int32, []> var_2134_groups_0 = const()[name = tensor<string, []>("op_2134_groups_0"), val = tensor<int32, []>(1)];`
1474	tensor<fp16, [768, 3072, 1, 1]> layers_10_fc2_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [1179648]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(55999296))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(57179008))), name = tensor<string, []>("layers_10_fc2_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 3072, 1, 1])];
1475	`tensor<fp16, [768]> layers_10_fc2_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_10_fc2_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(57179136)))];`
1476	`tensor<fp16, [1, 768, 1, 1500]> var_2134_cast_fp16 = conv(bias = layers_10_fc2_inlier_module_bias_to_fp16, dilations = var_2134_dilations_0, groups = var_2134_groups_0, pad = var_2134_pad_0, pad_type = var_2134_pad_type_0, strides = var_2134_strides_0, weight = layers_10_fc2_inlier_module_weight_to_fp16_palettized, x = input_87_cast_fp16)[name = tensor<string, []>("op_2134_cast_fp16")];`
1477	`tensor<string, []> var_2140_pad_type_0 = const()[name = tensor<string, []>("op_2140_pad_type_0"), val = tensor<string, []>("valid")];`
1478	`tensor<int32, [2]> var_2140_strides_0 = const()[name = tensor<string, []>("op_2140_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1479	`tensor<int32, [4]> var_2140_pad_0 = const()[name = tensor<string, []>("op_2140_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1480	`tensor<int32, [2]> var_2140_dilations_0 = const()[name = tensor<string, []>("op_2140_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1481	`tensor<int32, []> var_2140_groups_0 = const()[name = tensor<string, []>("op_2140_groups_0"), val = tensor<int32, []>(1)];`
1482	tensor<fp16, [768, 3072, 1, 1]> layers_10_fc2_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(57215232))), name = tensor<string, []>("layers_10_fc2_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [17216]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(57180736))), shape = tensor<uint32, [4]>([768, 3072, 1, 1])];
1483	`tensor<fp16, [1, 768, 1, 1500]> var_2140_cast_fp16 = conv(dilations = var_2140_dilations_0, groups = var_2140_groups_0, pad = var_2140_pad_0, pad_type = var_2140_pad_type_0, strides = var_2140_strides_0, weight = layers_10_fc2_outlier_module_weight_to_fp16_sparsified, x = input_87_cast_fp16)[name = tensor<string, []>("op_2140_cast_fp16")];`
1484	`tensor<fp16, [1, 768, 1, 1500]> hidden_states_25_cast_fp16 = add(x = var_2134_cast_fp16, y = var_2140_cast_fp16)[name = tensor<string, []>("hidden_states_25_cast_fp16")];`
1485	`tensor<fp16, [1, 768, 1, 1500]> inputs_45_cast_fp16 = add(x = inputs_43_cast_fp16, y = hidden_states_25_cast_fp16)[name = tensor<string, []>("inputs_45_cast_fp16")];`
1486	`tensor<int32, []> var_2146 = const()[name = tensor<string, []>("op_2146"), val = tensor<int32, []>(3)];`
1487	`tensor<int32, [1]> out_45_axes_0 = const()[name = tensor<string, []>("out_45_axes_0"), val = tensor<int32, [1]>([1])];`
1488	`tensor<fp16, []> var_2168_to_fp16 = const()[name = tensor<string, []>("op_2168_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
1489	`tensor<fp16, [1, 768, 1, 1500]> out_45_cast_fp16 = layer_norm(axes = out_45_axes_0, epsilon = var_2168_to_fp16, x = inputs_45_cast_fp16)[name = tensor<string, []>("out_45_cast_fp16")];`
1490	`tensor<fp16, [768]> obj_45_gamma_0_to_fp16 = const()[name = tensor<string, []>("obj_45_gamma_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(57510208)))];`
1491	`tensor<fp16, [768]> obj_45_beta_0_to_fp16 = const()[name = tensor<string, []>("obj_45_beta_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(57511808)))];`
1492	`tensor<fp16, []> obj_45_epsilon_0_to_fp16 = const()[name = tensor<string, []>("obj_45_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
1493	`tensor<fp16, [1, 768, 1, 1500]> obj_45_cast_fp16 = batch_norm(beta = obj_45_beta_0_to_fp16, epsilon = obj_45_epsilon_0_to_fp16, gamma = obj_45_gamma_0_to_fp16, mean = var_57_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_45_cast_fp16)[name = tensor<string, []>("obj_45_cast_fp16")];`
1494	`tensor<string, []> var_2190_pad_type_0 = const()[name = tensor<string, []>("op_2190_pad_type_0"), val = tensor<string, []>("valid")];`
1495	`tensor<int32, [2]> var_2190_strides_0 = const()[name = tensor<string, []>("op_2190_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1496	`tensor<int32, [4]> var_2190_pad_0 = const()[name = tensor<string, []>("op_2190_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1497	`tensor<int32, [2]> var_2190_dilations_0 = const()[name = tensor<string, []>("op_2190_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1498	`tensor<int32, []> var_2190_groups_0 = const()[name = tensor<string, []>("op_2190_groups_0"), val = tensor<int32, []>(1)];`
1499	tensor<fp16, [768, 768, 1, 1]> layers_11_self_attn_q_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(57513408))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(57808384))), name = tensor<string, []>("layers_11_self_attn_q_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
1500	`tensor<fp16, [768]> layers_11_self_attn_q_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_11_self_attn_q_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(57808512)))];`
1501	`tensor<fp16, [1, 768, 1, 1500]> var_2190_cast_fp16 = conv(bias = layers_11_self_attn_q_proj_inlier_module_bias_to_fp16, dilations = var_2190_dilations_0, groups = var_2190_groups_0, pad = var_2190_pad_0, pad_type = var_2190_pad_type_0, strides = var_2190_strides_0, weight = layers_11_self_attn_q_proj_inlier_module_weight_to_fp16_palettized, x = obj_45_cast_fp16)[name = tensor<string, []>("op_2190_cast_fp16")];`
1502	`tensor<string, []> var_2196_pad_type_0 = const()[name = tensor<string, []>("op_2196_pad_type_0"), val = tensor<string, []>("valid")];`
1503	`tensor<int32, [2]> var_2196_strides_0 = const()[name = tensor<string, []>("op_2196_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1504	`tensor<int32, [4]> var_2196_pad_0 = const()[name = tensor<string, []>("op_2196_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1505	`tensor<int32, [2]> var_2196_dilations_0 = const()[name = tensor<string, []>("op_2196_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1506	`tensor<int32, []> var_2196_groups_0 = const()[name = tensor<string, []>("op_2196_groups_0"), val = tensor<int32, []>(1)];`
1507	tensor<fp16, [768, 768, 1, 1]> layers_11_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(57816768))), name = tensor<string, []>("layers_11_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [3283]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(57810112))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
1508	`tensor<fp16, [1, 768, 1, 1500]> var_2196_cast_fp16 = conv(dilations = var_2196_dilations_0, groups = var_2196_groups_0, pad = var_2196_pad_0, pad_type = var_2196_pad_type_0, strides = var_2196_strides_0, weight = layers_11_self_attn_q_proj_outlier_module_weight_to_fp16_sparsified, x = obj_45_cast_fp16)[name = tensor<string, []>("op_2196_cast_fp16")];`
1509	`tensor<fp16, [1, 768, 1, 1500]> query_cast_fp16 = add(x = var_2190_cast_fp16, y = var_2196_cast_fp16)[name = tensor<string, []>("query_cast_fp16")];`
1510	`tensor<string, []> var_2205_pad_type_0 = const()[name = tensor<string, []>("op_2205_pad_type_0"), val = tensor<string, []>("valid")];`
1511	`tensor<int32, [2]> var_2205_strides_0 = const()[name = tensor<string, []>("op_2205_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1512	`tensor<int32, [4]> var_2205_pad_0 = const()[name = tensor<string, []>("op_2205_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1513	`tensor<int32, [2]> var_2205_dilations_0 = const()[name = tensor<string, []>("op_2205_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1514	`tensor<int32, []> var_2205_groups_0 = const()[name = tensor<string, []>("op_2205_groups_0"), val = tensor<int32, []>(1)];`
1515	tensor<fp16, [768, 768, 1, 1]> layers_11_self_attn_k_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(57890560))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(58185536))), name = tensor<string, []>("layers_11_self_attn_k_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
1516	`tensor<fp16, [1, 768, 1, 1500]> var_2205_cast_fp16 = conv(dilations = var_2205_dilations_0, groups = var_2205_groups_0, pad = var_2205_pad_0, pad_type = var_2205_pad_type_0, strides = var_2205_strides_0, weight = layers_11_self_attn_k_proj_inlier_module_weight_to_fp16_palettized, x = obj_45_cast_fp16)[name = tensor<string, []>("op_2205_cast_fp16")];`
1517	`tensor<string, []> var_2211_pad_type_0 = const()[name = tensor<string, []>("op_2211_pad_type_0"), val = tensor<string, []>("valid")];`
1518	`tensor<int32, [2]> var_2211_strides_0 = const()[name = tensor<string, []>("op_2211_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1519	`tensor<int32, [4]> var_2211_pad_0 = const()[name = tensor<string, []>("op_2211_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1520	`tensor<int32, [2]> var_2211_dilations_0 = const()[name = tensor<string, []>("op_2211_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1521	`tensor<int32, []> var_2211_groups_0 = const()[name = tensor<string, []>("op_2211_groups_0"), val = tensor<int32, []>(1)];`
1522	tensor<fp16, [768, 768, 1, 1]> layers_11_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(58192896))), name = tensor<string, []>("layers_11_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [3584]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(58185664))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
1523	`tensor<fp16, [1, 768, 1, 1500]> var_2211_cast_fp16 = conv(dilations = var_2211_dilations_0, groups = var_2211_groups_0, pad = var_2211_pad_0, pad_type = var_2211_pad_type_0, strides = var_2211_strides_0, weight = layers_11_self_attn_k_proj_outlier_module_weight_to_fp16_sparsified, x = obj_45_cast_fp16)[name = tensor<string, []>("op_2211_cast_fp16")];`
1524	`tensor<fp16, [1, 768, 1, 1500]> key_cast_fp16 = add(x = var_2205_cast_fp16, y = var_2211_cast_fp16)[name = tensor<string, []>("key_cast_fp16")];`
1525	`tensor<string, []> var_2221_pad_type_0 = const()[name = tensor<string, []>("op_2221_pad_type_0"), val = tensor<string, []>("valid")];`
1526	`tensor<int32, [2]> var_2221_strides_0 = const()[name = tensor<string, []>("op_2221_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1527	`tensor<int32, [4]> var_2221_pad_0 = const()[name = tensor<string, []>("op_2221_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1528	`tensor<int32, [2]> var_2221_dilations_0 = const()[name = tensor<string, []>("op_2221_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1529	`tensor<int32, []> var_2221_groups_0 = const()[name = tensor<string, []>("op_2221_groups_0"), val = tensor<int32, []>(1)];`
1530	tensor<fp16, [768, 768, 1, 1]> layers_11_self_attn_v_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(58266688))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(58561664))), name = tensor<string, []>("layers_11_self_attn_v_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
1531	`tensor<fp16, [768]> layers_11_self_attn_v_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_11_self_attn_v_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(58561792)))];`
1532	`tensor<fp16, [1, 768, 1, 1500]> var_2221_cast_fp16 = conv(bias = layers_11_self_attn_v_proj_inlier_module_bias_to_fp16, dilations = var_2221_dilations_0, groups = var_2221_groups_0, pad = var_2221_pad_0, pad_type = var_2221_pad_type_0, strides = var_2221_strides_0, weight = layers_11_self_attn_v_proj_inlier_module_weight_to_fp16_palettized, x = obj_45_cast_fp16)[name = tensor<string, []>("op_2221_cast_fp16")];`
1533	`tensor<string, []> var_2227_pad_type_0 = const()[name = tensor<string, []>("op_2227_pad_type_0"), val = tensor<string, []>("valid")];`
1534	`tensor<int32, [2]> var_2227_strides_0 = const()[name = tensor<string, []>("op_2227_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1535	`tensor<int32, [4]> var_2227_pad_0 = const()[name = tensor<string, []>("op_2227_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1536	`tensor<int32, [2]> var_2227_dilations_0 = const()[name = tensor<string, []>("op_2227_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1537	`tensor<int32, []> var_2227_groups_0 = const()[name = tensor<string, []>("op_2227_groups_0"), val = tensor<int32, []>(1)];`
1538	tensor<fp16, [768, 768, 1, 1]> layers_11_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(58569728))), name = tensor<string, []>("layers_11_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [3113]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(58563392))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
1539	`tensor<fp16, [1, 768, 1, 1500]> var_2227_cast_fp16 = conv(dilations = var_2227_dilations_0, groups = var_2227_groups_0, pad = var_2227_pad_0, pad_type = var_2227_pad_type_0, strides = var_2227_strides_0, weight = layers_11_self_attn_v_proj_outlier_module_weight_to_fp16_sparsified, x = obj_45_cast_fp16)[name = tensor<string, []>("op_2227_cast_fp16")];`
1540	`tensor<fp16, [1, 768, 1, 1500]> value_cast_fp16 = add(x = var_2221_cast_fp16, y = var_2227_cast_fp16)[name = tensor<string, []>("value_cast_fp16")];`
1541	`tensor<int32, [4]> var_2231 = const()[name = tensor<string, []>("op_2231"), val = tensor<int32, [4]>([1, 12, 64, 1500])];`
1542	`tensor<fp16, [1, 12, 64, 1500]> mh_q_cast_fp16 = reshape(shape = var_2231, x = query_cast_fp16)[name = tensor<string, []>("mh_q_cast_fp16")];`
1543	`tensor<fp16, []> var_2233_to_fp16 = const()[name = tensor<string, []>("op_2233_to_fp16"), val = tensor<fp16, []>(0x1p-3)];`
1544	`tensor<fp16, [1, 12, 64, 1500]> var_2234_cast_fp16 = mul(x = mh_q_cast_fp16, y = var_2233_to_fp16)[name = tensor<string, []>("op_2234_cast_fp16")];`
1545	`tensor<int32, [4]> var_2237 = const()[name = tensor<string, []>("op_2237"), val = tensor<int32, [4]>([1, 12, 64, 1500])];`
1546	`tensor<fp16, [1, 12, 64, 1500]> var_2238_cast_fp16 = reshape(shape = var_2237, x = key_cast_fp16)[name = tensor<string, []>("op_2238_cast_fp16")];`
1547	`tensor<bool, []> mh_w_transpose_x_0 = const()[name = tensor<string, []>("mh_w_transpose_x_0"), val = tensor<bool, []>(true)];`
1548	`tensor<bool, []> mh_w_transpose_y_0 = const()[name = tensor<string, []>("mh_w_transpose_y_0"), val = tensor<bool, []>(false)];`
1549	`tensor<fp16, [1, 12, 1500, 1500]> mh_w_cast_fp16 = matmul(transpose_x = mh_w_transpose_x_0, transpose_y = mh_w_transpose_y_0, x = var_2234_cast_fp16, y = var_2238_cast_fp16)[name = tensor<string, []>("mh_w_cast_fp16")];`
1550	`tensor<fp16, [1, 12, 1500, 1500]> var_2241_cast_fp16 = softmax(axis = var_2146, x = mh_w_cast_fp16)[name = tensor<string, []>("op_2241_cast_fp16")];`
1551	`tensor<int32, [4]> var_2242 = const()[name = tensor<string, []>("op_2242"), val = tensor<int32, [4]>([1, 12, 64, 1500])];`
1552	`tensor<fp16, [1, 12, 64, 1500]> var_2243_cast_fp16 = reshape(shape = var_2242, x = value_cast_fp16)[name = tensor<string, []>("op_2243_cast_fp16")];`
1553	`tensor<bool, []> attn_transpose_x_0 = const()[name = tensor<string, []>("attn_transpose_x_0"), val = tensor<bool, []>(false)];`
1554	`tensor<bool, []> attn_transpose_y_0 = const()[name = tensor<string, []>("attn_transpose_y_0"), val = tensor<bool, []>(true)];`
1555	`tensor<fp16, [1, 12, 64, 1500]> attn_cast_fp16 = matmul(transpose_x = attn_transpose_x_0, transpose_y = attn_transpose_y_0, x = var_2243_cast_fp16, y = var_2241_cast_fp16)[name = tensor<string, []>("attn_cast_fp16")];`
1556	`tensor<int32, [4]> var_2246 = const()[name = tensor<string, []>("op_2246"), val = tensor<int32, [4]>([1, 768, 1, 1500])];`
1557	`tensor<fp16, [1, 768, 1, 1500]> input_89_cast_fp16 = reshape(shape = var_2246, x = attn_cast_fp16)[name = tensor<string, []>("input_89_cast_fp16")];`
1558	`tensor<string, []> var_2256_pad_type_0 = const()[name = tensor<string, []>("op_2256_pad_type_0"), val = tensor<string, []>("valid")];`
1559	`tensor<int32, [2]> var_2256_strides_0 = const()[name = tensor<string, []>("op_2256_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1560	`tensor<int32, [4]> var_2256_pad_0 = const()[name = tensor<string, []>("op_2256_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1561	`tensor<int32, [2]> var_2256_dilations_0 = const()[name = tensor<string, []>("op_2256_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1562	`tensor<int32, []> var_2256_groups_0 = const()[name = tensor<string, []>("op_2256_groups_0"), val = tensor<int32, []>(1)];`
1563	tensor<fp16, [768, 768, 1, 1]> layers_11_self_attn_o_proj_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(58643520))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(58938496))), name = tensor<string, []>("layers_11_self_attn_o_proj_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
1564	`tensor<fp16, [768]> layers_11_self_attn_o_proj_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_11_self_attn_o_proj_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(58938624)))];`
1565	`tensor<fp16, [1, 768, 1, 1500]> var_2256_cast_fp16 = conv(bias = layers_11_self_attn_o_proj_inlier_module_bias_to_fp16, dilations = var_2256_dilations_0, groups = var_2256_groups_0, pad = var_2256_pad_0, pad_type = var_2256_pad_type_0, strides = var_2256_strides_0, weight = layers_11_self_attn_o_proj_inlier_module_weight_to_fp16_palettized, x = input_89_cast_fp16)[name = tensor<string, []>("op_2256_cast_fp16")];`
1566	`tensor<string, []> var_2262_pad_type_0 = const()[name = tensor<string, []>("op_2262_pad_type_0"), val = tensor<string, []>("valid")];`
1567	`tensor<int32, [2]> var_2262_strides_0 = const()[name = tensor<string, []>("op_2262_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1568	`tensor<int32, [4]> var_2262_pad_0 = const()[name = tensor<string, []>("op_2262_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1569	`tensor<int32, [2]> var_2262_dilations_0 = const()[name = tensor<string, []>("op_2262_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1570	`tensor<int32, []> var_2262_groups_0 = const()[name = tensor<string, []>("op_2262_groups_0"), val = tensor<int32, []>(1)];`
1571	tensor<fp16, [768, 768, 1, 1]> layers_11_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [73728]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(58947520))), name = tensor<string, []>("layers_11_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [3613]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(58940224))), shape = tensor<uint32, [4]>([768, 768, 1, 1])];
1572	`tensor<fp16, [1, 768, 1, 1500]> var_2262_cast_fp16 = conv(dilations = var_2262_dilations_0, groups = var_2262_groups_0, pad = var_2262_pad_0, pad_type = var_2262_pad_type_0, strides = var_2262_strides_0, weight = layers_11_self_attn_o_proj_outlier_module_weight_to_fp16_sparsified, x = input_89_cast_fp16)[name = tensor<string, []>("op_2262_cast_fp16")];`
1573	`tensor<fp16, [1, 768, 1, 1500]> obj_cast_fp16 = add(x = var_2256_cast_fp16, y = var_2262_cast_fp16)[name = tensor<string, []>("obj_cast_fp16")];`
1574	`tensor<fp16, [1, 768, 1, 1500]> inputs_47_cast_fp16 = add(x = inputs_45_cast_fp16, y = obj_cast_fp16)[name = tensor<string, []>("inputs_47_cast_fp16")];`
1575	`tensor<int32, [1]> out_47_axes_0 = const()[name = tensor<string, []>("out_47_axes_0"), val = tensor<int32, [1]>([1])];`
1576	`tensor<fp16, []> var_2273_to_fp16 = const()[name = tensor<string, []>("op_2273_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
1577	`tensor<fp16, [1, 768, 1, 1500]> out_47_cast_fp16 = layer_norm(axes = out_47_axes_0, epsilon = var_2273_to_fp16, x = inputs_47_cast_fp16)[name = tensor<string, []>("out_47_cast_fp16")];`
1578	`tensor<fp16, [768]> input_91_gamma_0_to_fp16 = const()[name = tensor<string, []>("input_91_gamma_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(59021312)))];`
1579	`tensor<fp16, [768]> input_91_beta_0_to_fp16 = const()[name = tensor<string, []>("input_91_beta_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(59022912)))];`
1580	`tensor<fp16, []> input_91_epsilon_0_to_fp16 = const()[name = tensor<string, []>("input_91_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
1581	`tensor<fp16, [1, 768, 1, 1500]> input_91_cast_fp16 = batch_norm(beta = input_91_beta_0_to_fp16, epsilon = input_91_epsilon_0_to_fp16, gamma = input_91_gamma_0_to_fp16, mean = var_57_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_47_cast_fp16)[name = tensor<string, []>("input_91_cast_fp16")];`
1582	`tensor<string, []> var_2291_pad_type_0 = const()[name = tensor<string, []>("op_2291_pad_type_0"), val = tensor<string, []>("valid")];`
1583	`tensor<int32, [2]> var_2291_strides_0 = const()[name = tensor<string, []>("op_2291_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1584	`tensor<int32, [4]> var_2291_pad_0 = const()[name = tensor<string, []>("op_2291_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1585	`tensor<int32, [2]> var_2291_dilations_0 = const()[name = tensor<string, []>("op_2291_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1586	`tensor<int32, []> var_2291_groups_0 = const()[name = tensor<string, []>("op_2291_groups_0"), val = tensor<int32, []>(1)];`
1587	tensor<fp16, [3072, 768, 1, 1]> layers_11_fc1_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [1179648]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(59024512))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(60204224))), name = tensor<string, []>("layers_11_fc1_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([3072, 768, 1, 1])];
1588	`tensor<fp16, [3072]> layers_11_fc1_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_11_fc1_inlier_module_bias_to_fp16"), val = tensor<fp16, [3072]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(60204352)))];`
1589	`tensor<fp16, [1, 3072, 1, 1500]> var_2291_cast_fp16 = conv(bias = layers_11_fc1_inlier_module_bias_to_fp16, dilations = var_2291_dilations_0, groups = var_2291_groups_0, pad = var_2291_pad_0, pad_type = var_2291_pad_type_0, strides = var_2291_strides_0, weight = layers_11_fc1_inlier_module_weight_to_fp16_palettized, x = input_91_cast_fp16)[name = tensor<string, []>("op_2291_cast_fp16")];`
1590	`tensor<string, []> var_2297_pad_type_0 = const()[name = tensor<string, []>("op_2297_pad_type_0"), val = tensor<string, []>("valid")];`
1591	`tensor<int32, [2]> var_2297_strides_0 = const()[name = tensor<string, []>("op_2297_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1592	`tensor<int32, [4]> var_2297_pad_0 = const()[name = tensor<string, []>("op_2297_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1593	`tensor<int32, [2]> var_2297_dilations_0 = const()[name = tensor<string, []>("op_2297_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1594	`tensor<int32, []> var_2297_groups_0 = const()[name = tensor<string, []>("op_2297_groups_0"), val = tensor<int32, []>(1)];`
1595	tensor<fp16, [3072, 768, 1, 1]> layers_11_fc1_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(60241728))), name = tensor<string, []>("layers_11_fc1_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [15540]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(60210560))), shape = tensor<uint32, [4]>([3072, 768, 1, 1])];
1596	`tensor<fp16, [1, 3072, 1, 1500]> var_2297_cast_fp16 = conv(dilations = var_2297_dilations_0, groups = var_2297_groups_0, pad = var_2297_pad_0, pad_type = var_2297_pad_type_0, strides = var_2297_strides_0, weight = layers_11_fc1_outlier_module_weight_to_fp16_sparsified, x = input_91_cast_fp16)[name = tensor<string, []>("op_2297_cast_fp16")];`
1597	`tensor<fp16, [1, 3072, 1, 1500]> input_93_cast_fp16 = add(x = var_2291_cast_fp16, y = var_2297_cast_fp16)[name = tensor<string, []>("input_93_cast_fp16")];`
1598	`tensor<string, []> input_mode_0 = const()[name = tensor<string, []>("input_mode_0"), val = tensor<string, []>("EXACT")];`
1599	`tensor<fp16, [1, 3072, 1, 1500]> input_cast_fp16 = gelu(mode = input_mode_0, x = input_93_cast_fp16)[name = tensor<string, []>("input_cast_fp16")];`
1600	`tensor<string, []> var_2308_pad_type_0 = const()[name = tensor<string, []>("op_2308_pad_type_0"), val = tensor<string, []>("valid")];`
1601	`tensor<int32, [2]> var_2308_strides_0 = const()[name = tensor<string, []>("op_2308_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1602	`tensor<int32, [4]> var_2308_pad_0 = const()[name = tensor<string, []>("op_2308_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1603	`tensor<int32, [2]> var_2308_dilations_0 = const()[name = tensor<string, []>("op_2308_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1604	`tensor<int32, []> var_2308_groups_0 = const()[name = tensor<string, []>("op_2308_groups_0"), val = tensor<int32, []>(1)];`
1605	tensor<fp16, [768, 3072, 1, 1]> layers_11_fc2_inlier_module_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor<uint8, [1179648]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(60536704))), lut = tensor<fp16, [16]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(61716416))), name = tensor<string, []>("layers_11_fc2_inlier_module_weight_to_fp16_palettized"), shape = tensor<uint32, [4]>([768, 3072, 1, 1])];
1606	`tensor<fp16, [768]> layers_11_fc2_inlier_module_bias_to_fp16 = const()[name = tensor<string, []>("layers_11_fc2_inlier_module_bias_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(61716544)))];`
1607	`tensor<fp16, [1, 768, 1, 1500]> var_2308_cast_fp16 = conv(bias = layers_11_fc2_inlier_module_bias_to_fp16, dilations = var_2308_dilations_0, groups = var_2308_groups_0, pad = var_2308_pad_0, pad_type = var_2308_pad_type_0, strides = var_2308_strides_0, weight = layers_11_fc2_inlier_module_weight_to_fp16_palettized, x = input_cast_fp16)[name = tensor<string, []>("op_2308_cast_fp16")];`
1608	`tensor<string, []> var_2314_pad_type_0 = const()[name = tensor<string, []>("op_2314_pad_type_0"), val = tensor<string, []>("valid")];`
1609	`tensor<int32, [2]> var_2314_strides_0 = const()[name = tensor<string, []>("op_2314_strides_0"), val = tensor<int32, [2]>([1, 1])];`
1610	`tensor<int32, [4]> var_2314_pad_0 = const()[name = tensor<string, []>("op_2314_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];`
1611	`tensor<int32, [2]> var_2314_dilations_0 = const()[name = tensor<string, []>("op_2314_dilations_0"), val = tensor<int32, [2]>([1, 1])];`
1612	`tensor<int32, []> var_2314_groups_0 = const()[name = tensor<string, []>("op_2314_groups_0"), val = tensor<int32, []>(1)];`
1613	tensor<fp16, [768, 3072, 1, 1]> layers_11_fc2_outlier_module_weight_to_fp16_sparsified = constexpr_sparse_to_dense()[mask = tensor<uint8, [294912]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(61753984))), name = tensor<string, []>("layers_11_fc2_outlier_module_weight_to_fp16_sparsified"), nonzero_data = tensor<fp16, [17871]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(61718144))), shape = tensor<uint32, [4]>([768, 3072, 1, 1])];
1614	`tensor<fp16, [1, 768, 1, 1500]> var_2314_cast_fp16 = conv(dilations = var_2314_dilations_0, groups = var_2314_groups_0, pad = var_2314_pad_0, pad_type = var_2314_pad_type_0, strides = var_2314_strides_0, weight = layers_11_fc2_outlier_module_weight_to_fp16_sparsified, x = input_cast_fp16)[name = tensor<string, []>("op_2314_cast_fp16")];`
1615	`tensor<fp16, [1, 768, 1, 1500]> hidden_states_cast_fp16 = add(x = var_2308_cast_fp16, y = var_2314_cast_fp16)[name = tensor<string, []>("hidden_states_cast_fp16")];`
1616	`tensor<fp16, [1, 768, 1, 1500]> inputs_cast_fp16 = add(x = inputs_47_cast_fp16, y = hidden_states_cast_fp16)[name = tensor<string, []>("inputs_cast_fp16")];`
1617	`tensor<int32, [1]> out_axes_0 = const()[name = tensor<string, []>("out_axes_0"), val = tensor<int32, [1]>([1])];`
1618	`tensor<fp16, []> var_2329_to_fp16 = const()[name = tensor<string, []>("op_2329_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
1619	`tensor<fp16, [1, 768, 1, 1500]> out_cast_fp16 = layer_norm(axes = out_axes_0, epsilon = var_2329_to_fp16, x = inputs_cast_fp16)[name = tensor<string, []>("out_cast_fp16")];`
1620	`tensor<fp16, [768]> encoder_output_embeds_type_fp32_gamma_0_to_fp16 = const()[name = tensor<string, []>("encoder_output_embeds_type_fp32_gamma_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(62048960)))];`
1621	`tensor<fp16, [768]> encoder_output_embeds_type_fp32_beta_0_to_fp16 = const()[name = tensor<string, []>("encoder_output_embeds_type_fp32_beta_0_to_fp16"), val = tensor<fp16, [768]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(62050560)))];`
1622	`tensor<fp16, []> encoder_output_embeds_type_fp32_epsilon_0_to_fp16 = const()[name = tensor<string, []>("encoder_output_embeds_type_fp32_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];`
1623	`tensor<fp16, [1, 768, 1, 1500]> encoder_output_embeds = batch_norm(beta = encoder_output_embeds_type_fp32_beta_0_to_fp16, epsilon = encoder_output_embeds_type_fp32_epsilon_0_to_fp16, gamma = encoder_output_embeds_type_fp32_gamma_0_to_fp16, mean = var_57_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_cast_fp16)[name = tensor<string, []>("encoder_output_embeds_type_fp32_cast_fp16")];`
1624	`} -> (encoder_output_embeds);`
1625	`}`