File size: 405,178 Bytes

b8f21db

program(1.0)
[buildInfo = dict<tensor<string, []>, tensor<string, []>>({{"coremlc-component-MIL", "3304.5.2"}, {"coremlc-version", "3304.6.2"}, {"coremltools-component-torch", "2.2.1"}, {"coremltools-source-dialect", "TorchScript"}, {"coremltools-version", "7.1"}})]
{
    func main<ios16>(tensor<fp16, [1, 77]> attention_mask, tensor<int32, [1, 77]> input_ids) {
            tensor<int32, []> x_1_axis_0 = const()[name = tensor<string, []>("x_1_axis_0"), val = tensor<int32, []>(0)];
            tensor<int32, []> x_1_batch_dims_0 = const()[name = tensor<string, []>("x_1_batch_dims_0"), val = tensor<int32, []>(0)];
            tensor<fp16, [32128, 4096]> embed_tokens_weight_to_fp16 = const()[name = tensor<string, []>("embed_tokens_weight_to_fp16"), val = tensor<fp16, [32128, 4096]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(64)))];
            tensor<fp16, [1, 77, 4096]> x_1_cast_fp16 = gather(axis = x_1_axis_0, batch_dims = x_1_batch_dims_0, indices = input_ids, x = embed_tokens_weight_to_fp16)[name = tensor<string, []>("x_1_cast_fp16")];
            tensor<int32, [3]> var_60_perm_0 = const()[name = tensor<string, []>("op_60_perm_0"), val = tensor<int32, [3]>([0, 2, 1])];
            tensor<int32, [1]> inputs_1_axes_0 = const()[name = tensor<string, []>("inputs_1_axes_0"), val = tensor<int32, [1]>([2])];
            tensor<fp16, [1, 4096, 77]> transpose_0 = transpose(perm = var_60_perm_0, x = x_1_cast_fp16)[name = tensor<string, []>("transpose_0")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_1_cast_fp16 = expand_dims(axes = inputs_1_axes_0, x = transpose_0)[name = tensor<string, []>("inputs_1_cast_fp16")];
            tensor<bool, []> var_66 = const()[name = tensor<string, []>("op_66"), val = tensor<bool, []>(true)];
            tensor<int32, []> var_67 = const()[name = tensor<string, []>("op_67"), val = tensor<int32, []>(1)];
            tensor<int32, []> var_71 = const()[name = tensor<string, []>("op_71"), val = tensor<int32, []>(3)];
            tensor<fp16, []> var_69_to_fp16 = const()[name = tensor<string, []>("op_69_to_fp16"), val = tensor<fp16, []>(-0x1.b18p+15)];
            tensor<fp16, []> var_68_to_fp16 = const()[name = tensor<string, []>("op_68_to_fp16"), val = tensor<fp16, []>(0x1.b18p+15)];
            tensor<fp16, [1, 4096, 1, 77]> inputs_3_cast_fp16 = clip(alpha = var_69_to_fp16, beta = var_68_to_fp16, x = inputs_1_cast_fp16)[name = tensor<string, []>("inputs_3_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_1_cast_fp16 = mul(x = inputs_3_cast_fp16, y = inputs_3_cast_fp16)[name = tensor<string, []>("inputs_sq_1_cast_fp16")];
            tensor<int32, [1]> var_88 = const()[name = tensor<string, []>("op_88"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_1_cast_fp16 = reduce_mean(axes = var_88, keep_dims = var_66, x = inputs_sq_1_cast_fp16)[name = tensor<string, []>("variance_1_cast_fp16")];
            tensor<fp16, []> var_90_to_fp16 = const()[name = tensor<string, []>("op_90_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_91_cast_fp16 = add(x = variance_1_cast_fp16, y = var_90_to_fp16)[name = tensor<string, []>("op_91_cast_fp16")];
            tensor<fp16, []> var_92_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_92_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_92_cast_fp16 = rsqrt(epsilon = var_92_epsilon_0_to_fp16, x = var_91_cast_fp16)[name = tensor<string, []>("op_92_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_1_cast_fp16 = mul(x = inputs_3_cast_fp16, y = var_92_cast_fp16)[name = tensor<string, []>("hidden_states_1_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_1_to_fp16 = const()[name = tensor<string, []>("w_1_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(263192704)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_1_cast_fp16 = mul(x = w_1_to_fp16, y = hidden_states_1_cast_fp16)[name = tensor<string, []>("obj_1_cast_fp16")];
            tensor<int32, [2]> var_106 = const()[name = tensor<string, []>("op_106"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_108 = const()[name = tensor<string, []>("op_108"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> query_1_pad_type_0 = const()[name = tensor<string, []>("query_1_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> query_1_pad_0 = const()[name = tensor<string, []>("query_1_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_0_layer_0_SelfAttention_q_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_0_layer_0_SelfAttention_q_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(263200960)))];
            tensor<fp16, [4096]> block_0_layer_0_SelfAttention_q_proj_bias_to_fp16 = const()[name = tensor<string, []>("block_0_layer_0_SelfAttention_q_proj_bias_to_fp16"), val = tensor<fp16, [4096]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(296755456)))];
            tensor<fp16, [1, 4096, 1, 77]> query_1_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_108, groups = var_67, pad = query_1_pad_0, pad_type = query_1_pad_type_0, strides = var_106, weight = block_0_layer_0_SelfAttention_q_proj_weight_to_fp16, x = obj_1_cast_fp16)[name = tensor<string, []>("query_1_cast_fp16")];
            tensor<int32, [2]> var_112 = const()[name = tensor<string, []>("op_112"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_114 = const()[name = tensor<string, []>("op_114"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> key_1_pad_type_0 = const()[name = tensor<string, []>("key_1_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> key_1_pad_0 = const()[name = tensor<string, []>("key_1_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_0_layer_0_SelfAttention_k_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_0_layer_0_SelfAttention_k_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(296763712)))];
            tensor<fp16, [1, 4096, 1, 77]> key_1_cast_fp16 = conv(dilations = var_114, groups = var_67, pad = key_1_pad_0, pad_type = key_1_pad_type_0, strides = var_112, weight = block_0_layer_0_SelfAttention_k_proj_weight_to_fp16, x = obj_1_cast_fp16)[name = tensor<string, []>("key_1_cast_fp16")];
            tensor<int32, [2]> var_119 = const()[name = tensor<string, []>("op_119"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_121 = const()[name = tensor<string, []>("op_121"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> value_1_pad_type_0 = const()[name = tensor<string, []>("value_1_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> value_1_pad_0 = const()[name = tensor<string, []>("value_1_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_0_layer_0_SelfAttention_v_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_0_layer_0_SelfAttention_v_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(330318208)))];
            tensor<fp16, [1, 4096, 1, 77]> value_1_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_121, groups = var_67, pad = value_1_pad_0, pad_type = value_1_pad_type_0, strides = var_119, weight = block_0_layer_0_SelfAttention_v_proj_weight_to_fp16, x = obj_1_cast_fp16)[name = tensor<string, []>("value_1_cast_fp16")];
            tensor<int32, [4]> var_125 = const()[name = tensor<string, []>("op_125"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_126_cast_fp16 = reshape(shape = var_125, x = query_1_cast_fp16)[name = tensor<string, []>("op_126_cast_fp16")];
            tensor<int32, [4]> var_127 = const()[name = tensor<string, []>("op_127"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_128_cast_fp16 = reshape(shape = var_127, x = key_1_cast_fp16)[name = tensor<string, []>("op_128_cast_fp16")];
            tensor<bool, []> mh_w_1_transpose_x_0 = const()[name = tensor<string, []>("mh_w_1_transpose_x_0"), val = tensor<bool, []>(true)];
            tensor<bool, []> mh_w_1_transpose_y_0 = const()[name = tensor<string, []>("mh_w_1_transpose_y_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 77, 77]> mh_w_1_cast_fp16 = matmul(transpose_x = mh_w_1_transpose_x_0, transpose_y = mh_w_1_transpose_y_0, x = var_126_cast_fp16, y = var_128_cast_fp16)[name = tensor<string, []>("mh_w_1_cast_fp16")];
            tensor<int32, [1]> var_132_axes_0 = const()[name = tensor<string, []>("op_132_axes_0"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 77]> var_132_cast_fp16 = expand_dims(axes = var_132_axes_0, x = attention_mask)[name = tensor<string, []>("op_132_cast_fp16")];
            tensor<int32, [1]> var_133_axes_0 = const()[name = tensor<string, []>("op_133_axes_0"), val = tensor<int32, [1]>([2])];
            tensor<fp16, [1, 1, 1, 77]> var_133_cast_fp16 = expand_dims(axes = var_133_axes_0, x = var_132_cast_fp16)[name = tensor<string, []>("op_133_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> mh_w_3_cast_fp16 = add(x = mh_w_1_cast_fp16, y = var_133_cast_fp16)[name = tensor<string, []>("mh_w_3_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> relative_attention_bias_to_fp16 = const()[name = tensor<string, []>("relative_attention_bias_to_fp16"), val = tensor<fp16, [1, 64, 77, 77]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(363872704)))];
            tensor<fp16, [1, 64, 77, 77]> mh_w_5_cast_fp16 = add(x = mh_w_3_cast_fp16, y = relative_attention_bias_to_fp16)[name = tensor<string, []>("mh_w_5_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> var_137_cast_fp16 = softmax(axis = var_71, x = mh_w_5_cast_fp16)[name = tensor<string, []>("op_137_cast_fp16")];
            tensor<int32, [4]> var_138 = const()[name = tensor<string, []>("op_138"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_139_cast_fp16 = reshape(shape = var_138, x = value_1_cast_fp16)[name = tensor<string, []>("op_139_cast_fp16")];
            tensor<bool, []> attn_1_transpose_x_0 = const()[name = tensor<string, []>("attn_1_transpose_x_0"), val = tensor<bool, []>(false)];
            tensor<bool, []> attn_1_transpose_y_0 = const()[name = tensor<string, []>("attn_1_transpose_y_0"), val = tensor<bool, []>(true)];
            tensor<fp16, [1, 64, 64, 77]> attn_1_cast_fp16 = matmul(transpose_x = attn_1_transpose_x_0, transpose_y = attn_1_transpose_y_0, x = var_139_cast_fp16, y = var_137_cast_fp16)[name = tensor<string, []>("attn_1_cast_fp16")];
            tensor<int32, [4]> var_142 = const()[name = tensor<string, []>("op_142"), val = tensor<int32, [4]>([1, 4096, 1, -1])];
            tensor<fp16, [1, 4096, 1, 77]> input_1_cast_fp16 = reshape(shape = var_142, x = attn_1_cast_fp16)[name = tensor<string, []>("input_1_cast_fp16")];
            tensor<int32, [2]> var_146 = const()[name = tensor<string, []>("op_146"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_148 = const()[name = tensor<string, []>("op_148"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> obj_5_pad_type_0 = const()[name = tensor<string, []>("obj_5_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> obj_5_pad_0 = const()[name = tensor<string, []>("obj_5_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_0_layer_0_SelfAttention_o_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_0_layer_0_SelfAttention_o_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(364631680)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_5_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_148, groups = var_67, pad = obj_5_pad_0, pad_type = obj_5_pad_type_0, strides = var_146, weight = block_0_layer_0_SelfAttention_o_proj_weight_to_fp16, x = input_1_cast_fp16)[name = tensor<string, []>("obj_5_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_5_cast_fp16 = add(x = inputs_3_cast_fp16, y = obj_5_cast_fp16)[name = tensor<string, []>("inputs_5_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_7_cast_fp16 = clip(alpha = var_69_to_fp16, beta = var_68_to_fp16, x = inputs_5_cast_fp16)[name = tensor<string, []>("inputs_7_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_3_cast_fp16 = mul(x = inputs_7_cast_fp16, y = inputs_7_cast_fp16)[name = tensor<string, []>("inputs_sq_3_cast_fp16")];
            tensor<int32, [1]> var_157 = const()[name = tensor<string, []>("op_157"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_3_cast_fp16 = reduce_mean(axes = var_157, keep_dims = var_66, x = inputs_sq_3_cast_fp16)[name = tensor<string, []>("variance_3_cast_fp16")];
            tensor<fp16, []> var_159_to_fp16 = const()[name = tensor<string, []>("op_159_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_160_cast_fp16 = add(x = variance_3_cast_fp16, y = var_159_to_fp16)[name = tensor<string, []>("op_160_cast_fp16")];
            tensor<fp16, []> var_161_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_161_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_161_cast_fp16 = rsqrt(epsilon = var_161_epsilon_0_to_fp16, x = var_160_cast_fp16)[name = tensor<string, []>("op_161_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_3_cast_fp16 = mul(x = inputs_7_cast_fp16, y = var_161_cast_fp16)[name = tensor<string, []>("hidden_states_3_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_3_to_fp16 = const()[name = tensor<string, []>("w_3_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(398186176)))];
            tensor<fp16, [1, 4096, 1, 77]> input_3_cast_fp16 = mul(x = w_3_to_fp16, y = hidden_states_3_cast_fp16)[name = tensor<string, []>("input_3_cast_fp16")];
            tensor<int32, [2]> var_174 = const()[name = tensor<string, []>("op_174"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_176 = const()[name = tensor<string, []>("op_176"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> x_3_pad_type_0 = const()[name = tensor<string, []>("x_3_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> x_3_pad_0 = const()[name = tensor<string, []>("x_3_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_0_layer_1_DenseReluDense_wi_0_weight_to_fp16 = const()[name = tensor<string, []>("block_0_layer_1_DenseReluDense_wi_0_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(398194432)))];
            tensor<fp16, [10240]> block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16 = const()[name = tensor<string, []>("block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16"), val = tensor<fp16, [10240]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(482080576)))];
            tensor<fp16, [1, 10240, 1, 77]> x_3_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_176, groups = var_67, pad = x_3_pad_0, pad_type = x_3_pad_type_0, strides = var_174, weight = block_0_layer_1_DenseReluDense_wi_0_weight_to_fp16, x = input_3_cast_fp16)[name = tensor<string, []>("x_3_cast_fp16")];
            tensor<string, []> var_190_mode_0 = const()[name = tensor<string, []>("op_190_mode_0"), val = tensor<string, []>("TANH_APPROXIMATION")];
            tensor<fp16, [1, 10240, 1, 77]> var_190_cast_fp16 = gelu(mode = var_190_mode_0, x = x_3_cast_fp16)[name = tensor<string, []>("op_190_cast_fp16")];
            tensor<int32, [2]> var_193 = const()[name = tensor<string, []>("op_193"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_195 = const()[name = tensor<string, []>("op_195"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_197_pad_type_0 = const()[name = tensor<string, []>("op_197_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_197_pad_0 = const()[name = tensor<string, []>("op_197_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_0_layer_1_DenseReluDense_wi_1_weight_to_fp16 = const()[name = tensor<string, []>("block_0_layer_1_DenseReluDense_wi_1_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(482101120)))];
            tensor<fp16, [1, 10240, 1, 77]> var_197_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_195, groups = var_67, pad = var_197_pad_0, pad_type = var_197_pad_type_0, strides = var_193, weight = block_0_layer_1_DenseReluDense_wi_1_weight_to_fp16, x = input_3_cast_fp16)[name = tensor<string, []>("op_197_cast_fp16")];
            tensor<fp16, [1, 10240, 1, 77]> input_5_cast_fp16 = mul(x = var_190_cast_fp16, y = var_197_cast_fp16)[name = tensor<string, []>("input_5_cast_fp16")];
            tensor<int32, [2]> var_201 = const()[name = tensor<string, []>("op_201"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_203 = const()[name = tensor<string, []>("op_203"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_205_pad_type_0 = const()[name = tensor<string, []>("op_205_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_205_pad_0 = const()[name = tensor<string, []>("op_205_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 10240, 1, 1]> block_0_layer_1_DenseReluDense_wo_weight_to_fp16 = const()[name = tensor<string, []>("block_0_layer_1_DenseReluDense_wo_weight_to_fp16"), val = tensor<fp16, [4096, 10240, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(565987264)))];
            tensor<fp16, [1, 4096, 1, 77]> var_205_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_203, groups = var_67, pad = var_205_pad_0, pad_type = var_205_pad_type_0, strides = var_201, weight = block_0_layer_1_DenseReluDense_wo_weight_to_fp16, x = input_5_cast_fp16)[name = tensor<string, []>("op_205_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_9_cast_fp16 = add(x = inputs_7_cast_fp16, y = var_205_cast_fp16)[name = tensor<string, []>("inputs_9_cast_fp16")];
            tensor<bool, []> var_210 = const()[name = tensor<string, []>("op_210"), val = tensor<bool, []>(true)];
            tensor<int32, []> var_211 = const()[name = tensor<string, []>("op_211"), val = tensor<int32, []>(1)];
            tensor<int32, []> var_215 = const()[name = tensor<string, []>("op_215"), val = tensor<int32, []>(3)];
            tensor<fp16, []> var_213_to_fp16 = const()[name = tensor<string, []>("op_213_to_fp16"), val = tensor<fp16, []>(-0x1.b18p+15)];
            tensor<fp16, []> var_212_to_fp16 = const()[name = tensor<string, []>("op_212_to_fp16"), val = tensor<fp16, []>(0x1.b18p+15)];
            tensor<fp16, [1, 4096, 1, 77]> inputs_11_cast_fp16 = clip(alpha = var_213_to_fp16, beta = var_212_to_fp16, x = inputs_9_cast_fp16)[name = tensor<string, []>("inputs_11_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_5_cast_fp16 = mul(x = inputs_11_cast_fp16, y = inputs_11_cast_fp16)[name = tensor<string, []>("inputs_sq_5_cast_fp16")];
            tensor<int32, [1]> var_232 = const()[name = tensor<string, []>("op_232"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_5_cast_fp16 = reduce_mean(axes = var_232, keep_dims = var_210, x = inputs_sq_5_cast_fp16)[name = tensor<string, []>("variance_5_cast_fp16")];
            tensor<fp16, []> var_234_to_fp16 = const()[name = tensor<string, []>("op_234_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_235_cast_fp16 = add(x = variance_5_cast_fp16, y = var_234_to_fp16)[name = tensor<string, []>("op_235_cast_fp16")];
            tensor<fp16, []> var_236_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_236_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_236_cast_fp16 = rsqrt(epsilon = var_236_epsilon_0_to_fp16, x = var_235_cast_fp16)[name = tensor<string, []>("op_236_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_5_cast_fp16 = mul(x = inputs_11_cast_fp16, y = var_236_cast_fp16)[name = tensor<string, []>("hidden_states_5_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_5_to_fp16 = const()[name = tensor<string, []>("w_5_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(649873408)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_7_cast_fp16 = mul(x = w_5_to_fp16, y = hidden_states_5_cast_fp16)[name = tensor<string, []>("obj_7_cast_fp16")];
            tensor<int32, [2]> var_250 = const()[name = tensor<string, []>("op_250"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_252 = const()[name = tensor<string, []>("op_252"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> query_3_pad_type_0 = const()[name = tensor<string, []>("query_3_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> query_3_pad_0 = const()[name = tensor<string, []>("query_3_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_1_layer_0_SelfAttention_q_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_1_layer_0_SelfAttention_q_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(649881664)))];
            tensor<fp16, [1, 4096, 1, 77]> query_3_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_252, groups = var_211, pad = query_3_pad_0, pad_type = query_3_pad_type_0, strides = var_250, weight = block_1_layer_0_SelfAttention_q_proj_weight_to_fp16, x = obj_7_cast_fp16)[name = tensor<string, []>("query_3_cast_fp16")];
            tensor<int32, [2]> var_256 = const()[name = tensor<string, []>("op_256"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_258 = const()[name = tensor<string, []>("op_258"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> key_3_pad_type_0 = const()[name = tensor<string, []>("key_3_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> key_3_pad_0 = const()[name = tensor<string, []>("key_3_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_1_layer_0_SelfAttention_k_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_1_layer_0_SelfAttention_k_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(683436160)))];
            tensor<fp16, [1, 4096, 1, 77]> key_3_cast_fp16 = conv(dilations = var_258, groups = var_211, pad = key_3_pad_0, pad_type = key_3_pad_type_0, strides = var_256, weight = block_1_layer_0_SelfAttention_k_proj_weight_to_fp16, x = obj_7_cast_fp16)[name = tensor<string, []>("key_3_cast_fp16")];
            tensor<int32, [2]> var_263 = const()[name = tensor<string, []>("op_263"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_265 = const()[name = tensor<string, []>("op_265"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> value_3_pad_type_0 = const()[name = tensor<string, []>("value_3_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> value_3_pad_0 = const()[name = tensor<string, []>("value_3_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_1_layer_0_SelfAttention_v_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_1_layer_0_SelfAttention_v_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(716990656)))];
            tensor<fp16, [1, 4096, 1, 77]> value_3_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_265, groups = var_211, pad = value_3_pad_0, pad_type = value_3_pad_type_0, strides = var_263, weight = block_1_layer_0_SelfAttention_v_proj_weight_to_fp16, x = obj_7_cast_fp16)[name = tensor<string, []>("value_3_cast_fp16")];
            tensor<int32, [4]> var_269 = const()[name = tensor<string, []>("op_269"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_270_cast_fp16 = reshape(shape = var_269, x = query_3_cast_fp16)[name = tensor<string, []>("op_270_cast_fp16")];
            tensor<int32, [4]> var_271 = const()[name = tensor<string, []>("op_271"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_272_cast_fp16 = reshape(shape = var_271, x = key_3_cast_fp16)[name = tensor<string, []>("op_272_cast_fp16")];
            tensor<bool, []> mh_w_7_transpose_x_0 = const()[name = tensor<string, []>("mh_w_7_transpose_x_0"), val = tensor<bool, []>(true)];
            tensor<bool, []> mh_w_7_transpose_y_0 = const()[name = tensor<string, []>("mh_w_7_transpose_y_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 77, 77]> mh_w_7_cast_fp16 = matmul(transpose_x = mh_w_7_transpose_x_0, transpose_y = mh_w_7_transpose_y_0, x = var_270_cast_fp16, y = var_272_cast_fp16)[name = tensor<string, []>("mh_w_7_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> mh_w_9_cast_fp16 = add(x = mh_w_7_cast_fp16, y = var_133_cast_fp16)[name = tensor<string, []>("mh_w_9_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> mh_w_11_cast_fp16 = add(x = mh_w_9_cast_fp16, y = relative_attention_bias_to_fp16)[name = tensor<string, []>("mh_w_11_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> var_281_cast_fp16 = softmax(axis = var_215, x = mh_w_11_cast_fp16)[name = tensor<string, []>("op_281_cast_fp16")];
            tensor<int32, [4]> var_282 = const()[name = tensor<string, []>("op_282"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_283_cast_fp16 = reshape(shape = var_282, x = value_3_cast_fp16)[name = tensor<string, []>("op_283_cast_fp16")];
            tensor<bool, []> attn_3_transpose_x_0 = const()[name = tensor<string, []>("attn_3_transpose_x_0"), val = tensor<bool, []>(false)];
            tensor<bool, []> attn_3_transpose_y_0 = const()[name = tensor<string, []>("attn_3_transpose_y_0"), val = tensor<bool, []>(true)];
            tensor<fp16, [1, 64, 64, 77]> attn_3_cast_fp16 = matmul(transpose_x = attn_3_transpose_x_0, transpose_y = attn_3_transpose_y_0, x = var_283_cast_fp16, y = var_281_cast_fp16)[name = tensor<string, []>("attn_3_cast_fp16")];
            tensor<int32, [4]> var_286 = const()[name = tensor<string, []>("op_286"), val = tensor<int32, [4]>([1, 4096, 1, -1])];
            tensor<fp16, [1, 4096, 1, 77]> input_7_cast_fp16 = reshape(shape = var_286, x = attn_3_cast_fp16)[name = tensor<string, []>("input_7_cast_fp16")];
            tensor<int32, [2]> var_290 = const()[name = tensor<string, []>("op_290"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_292 = const()[name = tensor<string, []>("op_292"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> obj_9_pad_type_0 = const()[name = tensor<string, []>("obj_9_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> obj_9_pad_0 = const()[name = tensor<string, []>("obj_9_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_1_layer_0_SelfAttention_o_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_1_layer_0_SelfAttention_o_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(750545152)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_9_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_292, groups = var_211, pad = obj_9_pad_0, pad_type = obj_9_pad_type_0, strides = var_290, weight = block_1_layer_0_SelfAttention_o_proj_weight_to_fp16, x = input_7_cast_fp16)[name = tensor<string, []>("obj_9_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_13_cast_fp16 = add(x = inputs_11_cast_fp16, y = obj_9_cast_fp16)[name = tensor<string, []>("inputs_13_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_15_cast_fp16 = clip(alpha = var_213_to_fp16, beta = var_212_to_fp16, x = inputs_13_cast_fp16)[name = tensor<string, []>("inputs_15_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_7_cast_fp16 = mul(x = inputs_15_cast_fp16, y = inputs_15_cast_fp16)[name = tensor<string, []>("inputs_sq_7_cast_fp16")];
            tensor<int32, [1]> var_301 = const()[name = tensor<string, []>("op_301"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_7_cast_fp16 = reduce_mean(axes = var_301, keep_dims = var_210, x = inputs_sq_7_cast_fp16)[name = tensor<string, []>("variance_7_cast_fp16")];
            tensor<fp16, []> var_303_to_fp16 = const()[name = tensor<string, []>("op_303_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_304_cast_fp16 = add(x = variance_7_cast_fp16, y = var_303_to_fp16)[name = tensor<string, []>("op_304_cast_fp16")];
            tensor<fp16, []> var_305_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_305_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_305_cast_fp16 = rsqrt(epsilon = var_305_epsilon_0_to_fp16, x = var_304_cast_fp16)[name = tensor<string, []>("op_305_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_7_cast_fp16 = mul(x = inputs_15_cast_fp16, y = var_305_cast_fp16)[name = tensor<string, []>("hidden_states_7_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_7_to_fp16 = const()[name = tensor<string, []>("w_7_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(784099648)))];
            tensor<fp16, [1, 4096, 1, 77]> input_9_cast_fp16 = mul(x = w_7_to_fp16, y = hidden_states_7_cast_fp16)[name = tensor<string, []>("input_9_cast_fp16")];
            tensor<int32, [2]> var_318 = const()[name = tensor<string, []>("op_318"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_320 = const()[name = tensor<string, []>("op_320"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> x_5_pad_type_0 = const()[name = tensor<string, []>("x_5_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> x_5_pad_0 = const()[name = tensor<string, []>("x_5_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_1_layer_1_DenseReluDense_wi_0_weight_to_fp16 = const()[name = tensor<string, []>("block_1_layer_1_DenseReluDense_wi_0_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(784107904)))];
            tensor<fp16, [1, 10240, 1, 77]> x_5_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_320, groups = var_211, pad = x_5_pad_0, pad_type = x_5_pad_type_0, strides = var_318, weight = block_1_layer_1_DenseReluDense_wi_0_weight_to_fp16, x = input_9_cast_fp16)[name = tensor<string, []>("x_5_cast_fp16")];
            tensor<string, []> var_334_mode_0 = const()[name = tensor<string, []>("op_334_mode_0"), val = tensor<string, []>("TANH_APPROXIMATION")];
            tensor<fp16, [1, 10240, 1, 77]> var_334_cast_fp16 = gelu(mode = var_334_mode_0, x = x_5_cast_fp16)[name = tensor<string, []>("op_334_cast_fp16")];
            tensor<int32, [2]> var_337 = const()[name = tensor<string, []>("op_337"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_339 = const()[name = tensor<string, []>("op_339"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_341_pad_type_0 = const()[name = tensor<string, []>("op_341_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_341_pad_0 = const()[name = tensor<string, []>("op_341_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_1_layer_1_DenseReluDense_wi_1_weight_to_fp16 = const()[name = tensor<string, []>("block_1_layer_1_DenseReluDense_wi_1_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(867994048)))];
            tensor<fp16, [1, 10240, 1, 77]> var_341_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_339, groups = var_211, pad = var_341_pad_0, pad_type = var_341_pad_type_0, strides = var_337, weight = block_1_layer_1_DenseReluDense_wi_1_weight_to_fp16, x = input_9_cast_fp16)[name = tensor<string, []>("op_341_cast_fp16")];
            tensor<fp16, [1, 10240, 1, 77]> input_11_cast_fp16 = mul(x = var_334_cast_fp16, y = var_341_cast_fp16)[name = tensor<string, []>("input_11_cast_fp16")];
            tensor<int32, [2]> var_345 = const()[name = tensor<string, []>("op_345"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_347 = const()[name = tensor<string, []>("op_347"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_349_pad_type_0 = const()[name = tensor<string, []>("op_349_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_349_pad_0 = const()[name = tensor<string, []>("op_349_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 10240, 1, 1]> block_1_layer_1_DenseReluDense_wo_weight_to_fp16 = const()[name = tensor<string, []>("block_1_layer_1_DenseReluDense_wo_weight_to_fp16"), val = tensor<fp16, [4096, 10240, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(951880192)))];
            tensor<fp16, [1, 4096, 1, 77]> var_349_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_347, groups = var_211, pad = var_349_pad_0, pad_type = var_349_pad_type_0, strides = var_345, weight = block_1_layer_1_DenseReluDense_wo_weight_to_fp16, x = input_11_cast_fp16)[name = tensor<string, []>("op_349_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_17_cast_fp16 = add(x = inputs_15_cast_fp16, y = var_349_cast_fp16)[name = tensor<string, []>("inputs_17_cast_fp16")];
            tensor<bool, []> var_354 = const()[name = tensor<string, []>("op_354"), val = tensor<bool, []>(true)];
            tensor<int32, []> var_355 = const()[name = tensor<string, []>("op_355"), val = tensor<int32, []>(1)];
            tensor<int32, []> var_359 = const()[name = tensor<string, []>("op_359"), val = tensor<int32, []>(3)];
            tensor<fp16, []> var_357_to_fp16 = const()[name = tensor<string, []>("op_357_to_fp16"), val = tensor<fp16, []>(-0x1.b18p+15)];
            tensor<fp16, []> var_356_to_fp16 = const()[name = tensor<string, []>("op_356_to_fp16"), val = tensor<fp16, []>(0x1.b18p+15)];
            tensor<fp16, [1, 4096, 1, 77]> inputs_19_cast_fp16 = clip(alpha = var_357_to_fp16, beta = var_356_to_fp16, x = inputs_17_cast_fp16)[name = tensor<string, []>("inputs_19_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_9_cast_fp16 = mul(x = inputs_19_cast_fp16, y = inputs_19_cast_fp16)[name = tensor<string, []>("inputs_sq_9_cast_fp16")];
            tensor<int32, [1]> var_376 = const()[name = tensor<string, []>("op_376"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_9_cast_fp16 = reduce_mean(axes = var_376, keep_dims = var_354, x = inputs_sq_9_cast_fp16)[name = tensor<string, []>("variance_9_cast_fp16")];
            tensor<fp16, []> var_378_to_fp16 = const()[name = tensor<string, []>("op_378_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_379_cast_fp16 = add(x = variance_9_cast_fp16, y = var_378_to_fp16)[name = tensor<string, []>("op_379_cast_fp16")];
            tensor<fp16, []> var_380_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_380_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_380_cast_fp16 = rsqrt(epsilon = var_380_epsilon_0_to_fp16, x = var_379_cast_fp16)[name = tensor<string, []>("op_380_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_9_cast_fp16 = mul(x = inputs_19_cast_fp16, y = var_380_cast_fp16)[name = tensor<string, []>("hidden_states_9_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_9_to_fp16 = const()[name = tensor<string, []>("w_9_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(1035766336)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_11_cast_fp16 = mul(x = w_9_to_fp16, y = hidden_states_9_cast_fp16)[name = tensor<string, []>("obj_11_cast_fp16")];
            tensor<int32, [2]> var_394 = const()[name = tensor<string, []>("op_394"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_396 = const()[name = tensor<string, []>("op_396"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> query_5_pad_type_0 = const()[name = tensor<string, []>("query_5_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> query_5_pad_0 = const()[name = tensor<string, []>("query_5_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_2_layer_0_SelfAttention_q_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_2_layer_0_SelfAttention_q_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(1035774592)))];
            tensor<fp16, [1, 4096, 1, 77]> query_5_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_396, groups = var_355, pad = query_5_pad_0, pad_type = query_5_pad_type_0, strides = var_394, weight = block_2_layer_0_SelfAttention_q_proj_weight_to_fp16, x = obj_11_cast_fp16)[name = tensor<string, []>("query_5_cast_fp16")];
            tensor<int32, [2]> var_400 = const()[name = tensor<string, []>("op_400"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_402 = const()[name = tensor<string, []>("op_402"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> key_5_pad_type_0 = const()[name = tensor<string, []>("key_5_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> key_5_pad_0 = const()[name = tensor<string, []>("key_5_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_2_layer_0_SelfAttention_k_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_2_layer_0_SelfAttention_k_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(1069329088)))];
            tensor<fp16, [1, 4096, 1, 77]> key_5_cast_fp16 = conv(dilations = var_402, groups = var_355, pad = key_5_pad_0, pad_type = key_5_pad_type_0, strides = var_400, weight = block_2_layer_0_SelfAttention_k_proj_weight_to_fp16, x = obj_11_cast_fp16)[name = tensor<string, []>("key_5_cast_fp16")];
            tensor<int32, [2]> var_407 = const()[name = tensor<string, []>("op_407"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_409 = const()[name = tensor<string, []>("op_409"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> value_5_pad_type_0 = const()[name = tensor<string, []>("value_5_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> value_5_pad_0 = const()[name = tensor<string, []>("value_5_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_2_layer_0_SelfAttention_v_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_2_layer_0_SelfAttention_v_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(1102883584)))];
            tensor<fp16, [1, 4096, 1, 77]> value_5_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_409, groups = var_355, pad = value_5_pad_0, pad_type = value_5_pad_type_0, strides = var_407, weight = block_2_layer_0_SelfAttention_v_proj_weight_to_fp16, x = obj_11_cast_fp16)[name = tensor<string, []>("value_5_cast_fp16")];
            tensor<int32, [4]> var_413 = const()[name = tensor<string, []>("op_413"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_414_cast_fp16 = reshape(shape = var_413, x = query_5_cast_fp16)[name = tensor<string, []>("op_414_cast_fp16")];
            tensor<int32, [4]> var_415 = const()[name = tensor<string, []>("op_415"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_416_cast_fp16 = reshape(shape = var_415, x = key_5_cast_fp16)[name = tensor<string, []>("op_416_cast_fp16")];
            tensor<bool, []> mh_w_13_transpose_x_0 = const()[name = tensor<string, []>("mh_w_13_transpose_x_0"), val = tensor<bool, []>(true)];
            tensor<bool, []> mh_w_13_transpose_y_0 = const()[name = tensor<string, []>("mh_w_13_transpose_y_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 77, 77]> mh_w_13_cast_fp16 = matmul(transpose_x = mh_w_13_transpose_x_0, transpose_y = mh_w_13_transpose_y_0, x = var_414_cast_fp16, y = var_416_cast_fp16)[name = tensor<string, []>("mh_w_13_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> mh_w_15_cast_fp16 = add(x = mh_w_13_cast_fp16, y = var_133_cast_fp16)[name = tensor<string, []>("mh_w_15_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> mh_w_17_cast_fp16 = add(x = mh_w_15_cast_fp16, y = relative_attention_bias_to_fp16)[name = tensor<string, []>("mh_w_17_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> var_425_cast_fp16 = softmax(axis = var_359, x = mh_w_17_cast_fp16)[name = tensor<string, []>("op_425_cast_fp16")];
            tensor<int32, [4]> var_426 = const()[name = tensor<string, []>("op_426"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_427_cast_fp16 = reshape(shape = var_426, x = value_5_cast_fp16)[name = tensor<string, []>("op_427_cast_fp16")];
            tensor<bool, []> attn_5_transpose_x_0 = const()[name = tensor<string, []>("attn_5_transpose_x_0"), val = tensor<bool, []>(false)];
            tensor<bool, []> attn_5_transpose_y_0 = const()[name = tensor<string, []>("attn_5_transpose_y_0"), val = tensor<bool, []>(true)];
            tensor<fp16, [1, 64, 64, 77]> attn_5_cast_fp16 = matmul(transpose_x = attn_5_transpose_x_0, transpose_y = attn_5_transpose_y_0, x = var_427_cast_fp16, y = var_425_cast_fp16)[name = tensor<string, []>("attn_5_cast_fp16")];
            tensor<int32, [4]> var_430 = const()[name = tensor<string, []>("op_430"), val = tensor<int32, [4]>([1, 4096, 1, -1])];
            tensor<fp16, [1, 4096, 1, 77]> input_13_cast_fp16 = reshape(shape = var_430, x = attn_5_cast_fp16)[name = tensor<string, []>("input_13_cast_fp16")];
            tensor<int32, [2]> var_434 = const()[name = tensor<string, []>("op_434"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_436 = const()[name = tensor<string, []>("op_436"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> obj_13_pad_type_0 = const()[name = tensor<string, []>("obj_13_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> obj_13_pad_0 = const()[name = tensor<string, []>("obj_13_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_2_layer_0_SelfAttention_o_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_2_layer_0_SelfAttention_o_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(1136438080)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_13_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_436, groups = var_355, pad = obj_13_pad_0, pad_type = obj_13_pad_type_0, strides = var_434, weight = block_2_layer_0_SelfAttention_o_proj_weight_to_fp16, x = input_13_cast_fp16)[name = tensor<string, []>("obj_13_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_21_cast_fp16 = add(x = inputs_19_cast_fp16, y = obj_13_cast_fp16)[name = tensor<string, []>("inputs_21_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_23_cast_fp16 = clip(alpha = var_357_to_fp16, beta = var_356_to_fp16, x = inputs_21_cast_fp16)[name = tensor<string, []>("inputs_23_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_11_cast_fp16 = mul(x = inputs_23_cast_fp16, y = inputs_23_cast_fp16)[name = tensor<string, []>("inputs_sq_11_cast_fp16")];
            tensor<int32, [1]> var_445 = const()[name = tensor<string, []>("op_445"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_11_cast_fp16 = reduce_mean(axes = var_445, keep_dims = var_354, x = inputs_sq_11_cast_fp16)[name = tensor<string, []>("variance_11_cast_fp16")];
            tensor<fp16, []> var_447_to_fp16 = const()[name = tensor<string, []>("op_447_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_448_cast_fp16 = add(x = variance_11_cast_fp16, y = var_447_to_fp16)[name = tensor<string, []>("op_448_cast_fp16")];
            tensor<fp16, []> var_449_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_449_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_449_cast_fp16 = rsqrt(epsilon = var_449_epsilon_0_to_fp16, x = var_448_cast_fp16)[name = tensor<string, []>("op_449_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_11_cast_fp16 = mul(x = inputs_23_cast_fp16, y = var_449_cast_fp16)[name = tensor<string, []>("hidden_states_11_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_11_to_fp16 = const()[name = tensor<string, []>("w_11_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(1169992576)))];
            tensor<fp16, [1, 4096, 1, 77]> input_15_cast_fp16 = mul(x = w_11_to_fp16, y = hidden_states_11_cast_fp16)[name = tensor<string, []>("input_15_cast_fp16")];
            tensor<int32, [2]> var_462 = const()[name = tensor<string, []>("op_462"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_464 = const()[name = tensor<string, []>("op_464"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> x_7_pad_type_0 = const()[name = tensor<string, []>("x_7_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> x_7_pad_0 = const()[name = tensor<string, []>("x_7_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_2_layer_1_DenseReluDense_wi_0_weight_to_fp16 = const()[name = tensor<string, []>("block_2_layer_1_DenseReluDense_wi_0_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(1170000832)))];
            tensor<fp16, [1, 10240, 1, 77]> x_7_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_464, groups = var_355, pad = x_7_pad_0, pad_type = x_7_pad_type_0, strides = var_462, weight = block_2_layer_1_DenseReluDense_wi_0_weight_to_fp16, x = input_15_cast_fp16)[name = tensor<string, []>("x_7_cast_fp16")];
            tensor<string, []> var_478_mode_0 = const()[name = tensor<string, []>("op_478_mode_0"), val = tensor<string, []>("TANH_APPROXIMATION")];
            tensor<fp16, [1, 10240, 1, 77]> var_478_cast_fp16 = gelu(mode = var_478_mode_0, x = x_7_cast_fp16)[name = tensor<string, []>("op_478_cast_fp16")];
            tensor<int32, [2]> var_481 = const()[name = tensor<string, []>("op_481"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_483 = const()[name = tensor<string, []>("op_483"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_485_pad_type_0 = const()[name = tensor<string, []>("op_485_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_485_pad_0 = const()[name = tensor<string, []>("op_485_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_2_layer_1_DenseReluDense_wi_1_weight_to_fp16 = const()[name = tensor<string, []>("block_2_layer_1_DenseReluDense_wi_1_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(1253886976)))];
            tensor<fp16, [1, 10240, 1, 77]> var_485_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_483, groups = var_355, pad = var_485_pad_0, pad_type = var_485_pad_type_0, strides = var_481, weight = block_2_layer_1_DenseReluDense_wi_1_weight_to_fp16, x = input_15_cast_fp16)[name = tensor<string, []>("op_485_cast_fp16")];
            tensor<fp16, [1, 10240, 1, 77]> input_17_cast_fp16 = mul(x = var_478_cast_fp16, y = var_485_cast_fp16)[name = tensor<string, []>("input_17_cast_fp16")];
            tensor<int32, [2]> var_489 = const()[name = tensor<string, []>("op_489"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_491 = const()[name = tensor<string, []>("op_491"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_493_pad_type_0 = const()[name = tensor<string, []>("op_493_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_493_pad_0 = const()[name = tensor<string, []>("op_493_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 10240, 1, 1]> block_2_layer_1_DenseReluDense_wo_weight_to_fp16 = const()[name = tensor<string, []>("block_2_layer_1_DenseReluDense_wo_weight_to_fp16"), val = tensor<fp16, [4096, 10240, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(1337773120)))];
            tensor<fp16, [1, 4096, 1, 77]> var_493_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_491, groups = var_355, pad = var_493_pad_0, pad_type = var_493_pad_type_0, strides = var_489, weight = block_2_layer_1_DenseReluDense_wo_weight_to_fp16, x = input_17_cast_fp16)[name = tensor<string, []>("op_493_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_25_cast_fp16 = add(x = inputs_23_cast_fp16, y = var_493_cast_fp16)[name = tensor<string, []>("inputs_25_cast_fp16")];
            tensor<bool, []> var_498 = const()[name = tensor<string, []>("op_498"), val = tensor<bool, []>(true)];
            tensor<int32, []> var_499 = const()[name = tensor<string, []>("op_499"), val = tensor<int32, []>(1)];
            tensor<int32, []> var_503 = const()[name = tensor<string, []>("op_503"), val = tensor<int32, []>(3)];
            tensor<fp16, []> var_501_to_fp16 = const()[name = tensor<string, []>("op_501_to_fp16"), val = tensor<fp16, []>(-0x1.b18p+15)];
            tensor<fp16, []> var_500_to_fp16 = const()[name = tensor<string, []>("op_500_to_fp16"), val = tensor<fp16, []>(0x1.b18p+15)];
            tensor<fp16, [1, 4096, 1, 77]> inputs_27_cast_fp16 = clip(alpha = var_501_to_fp16, beta = var_500_to_fp16, x = inputs_25_cast_fp16)[name = tensor<string, []>("inputs_27_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_13_cast_fp16 = mul(x = inputs_27_cast_fp16, y = inputs_27_cast_fp16)[name = tensor<string, []>("inputs_sq_13_cast_fp16")];
            tensor<int32, [1]> var_520 = const()[name = tensor<string, []>("op_520"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_13_cast_fp16 = reduce_mean(axes = var_520, keep_dims = var_498, x = inputs_sq_13_cast_fp16)[name = tensor<string, []>("variance_13_cast_fp16")];
            tensor<fp16, []> var_522_to_fp16 = const()[name = tensor<string, []>("op_522_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_523_cast_fp16 = add(x = variance_13_cast_fp16, y = var_522_to_fp16)[name = tensor<string, []>("op_523_cast_fp16")];
            tensor<fp16, []> var_524_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_524_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_524_cast_fp16 = rsqrt(epsilon = var_524_epsilon_0_to_fp16, x = var_523_cast_fp16)[name = tensor<string, []>("op_524_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_13_cast_fp16 = mul(x = inputs_27_cast_fp16, y = var_524_cast_fp16)[name = tensor<string, []>("hidden_states_13_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_13_to_fp16 = const()[name = tensor<string, []>("w_13_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(1421659264)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_15_cast_fp16 = mul(x = w_13_to_fp16, y = hidden_states_13_cast_fp16)[name = tensor<string, []>("obj_15_cast_fp16")];
            tensor<int32, [2]> var_538 = const()[name = tensor<string, []>("op_538"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_540 = const()[name = tensor<string, []>("op_540"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> query_7_pad_type_0 = const()[name = tensor<string, []>("query_7_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> query_7_pad_0 = const()[name = tensor<string, []>("query_7_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_3_layer_0_SelfAttention_q_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_3_layer_0_SelfAttention_q_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(1421667520)))];
            tensor<fp16, [1, 4096, 1, 77]> query_7_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_540, groups = var_499, pad = query_7_pad_0, pad_type = query_7_pad_type_0, strides = var_538, weight = block_3_layer_0_SelfAttention_q_proj_weight_to_fp16, x = obj_15_cast_fp16)[name = tensor<string, []>("query_7_cast_fp16")];
            tensor<int32, [2]> var_544 = const()[name = tensor<string, []>("op_544"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_546 = const()[name = tensor<string, []>("op_546"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> key_7_pad_type_0 = const()[name = tensor<string, []>("key_7_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> key_7_pad_0 = const()[name = tensor<string, []>("key_7_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_3_layer_0_SelfAttention_k_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_3_layer_0_SelfAttention_k_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(1455222016)))];
            tensor<fp16, [1, 4096, 1, 77]> key_7_cast_fp16 = conv(dilations = var_546, groups = var_499, pad = key_7_pad_0, pad_type = key_7_pad_type_0, strides = var_544, weight = block_3_layer_0_SelfAttention_k_proj_weight_to_fp16, x = obj_15_cast_fp16)[name = tensor<string, []>("key_7_cast_fp16")];
            tensor<int32, [2]> var_551 = const()[name = tensor<string, []>("op_551"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_553 = const()[name = tensor<string, []>("op_553"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> value_7_pad_type_0 = const()[name = tensor<string, []>("value_7_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> value_7_pad_0 = const()[name = tensor<string, []>("value_7_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_3_layer_0_SelfAttention_v_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_3_layer_0_SelfAttention_v_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(1488776512)))];
            tensor<fp16, [1, 4096, 1, 77]> value_7_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_553, groups = var_499, pad = value_7_pad_0, pad_type = value_7_pad_type_0, strides = var_551, weight = block_3_layer_0_SelfAttention_v_proj_weight_to_fp16, x = obj_15_cast_fp16)[name = tensor<string, []>("value_7_cast_fp16")];
            tensor<int32, [4]> var_557 = const()[name = tensor<string, []>("op_557"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_558_cast_fp16 = reshape(shape = var_557, x = query_7_cast_fp16)[name = tensor<string, []>("op_558_cast_fp16")];
            tensor<int32, [4]> var_559 = const()[name = tensor<string, []>("op_559"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_560_cast_fp16 = reshape(shape = var_559, x = key_7_cast_fp16)[name = tensor<string, []>("op_560_cast_fp16")];
            tensor<bool, []> mh_w_19_transpose_x_0 = const()[name = tensor<string, []>("mh_w_19_transpose_x_0"), val = tensor<bool, []>(true)];
            tensor<bool, []> mh_w_19_transpose_y_0 = const()[name = tensor<string, []>("mh_w_19_transpose_y_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 77, 77]> mh_w_19_cast_fp16 = matmul(transpose_x = mh_w_19_transpose_x_0, transpose_y = mh_w_19_transpose_y_0, x = var_558_cast_fp16, y = var_560_cast_fp16)[name = tensor<string, []>("mh_w_19_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> mh_w_21_cast_fp16 = add(x = mh_w_19_cast_fp16, y = var_133_cast_fp16)[name = tensor<string, []>("mh_w_21_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> mh_w_23_cast_fp16 = add(x = mh_w_21_cast_fp16, y = relative_attention_bias_to_fp16)[name = tensor<string, []>("mh_w_23_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> var_569_cast_fp16 = softmax(axis = var_503, x = mh_w_23_cast_fp16)[name = tensor<string, []>("op_569_cast_fp16")];
            tensor<int32, [4]> var_570 = const()[name = tensor<string, []>("op_570"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_571_cast_fp16 = reshape(shape = var_570, x = value_7_cast_fp16)[name = tensor<string, []>("op_571_cast_fp16")];
            tensor<bool, []> attn_7_transpose_x_0 = const()[name = tensor<string, []>("attn_7_transpose_x_0"), val = tensor<bool, []>(false)];
            tensor<bool, []> attn_7_transpose_y_0 = const()[name = tensor<string, []>("attn_7_transpose_y_0"), val = tensor<bool, []>(true)];
            tensor<fp16, [1, 64, 64, 77]> attn_7_cast_fp16 = matmul(transpose_x = attn_7_transpose_x_0, transpose_y = attn_7_transpose_y_0, x = var_571_cast_fp16, y = var_569_cast_fp16)[name = tensor<string, []>("attn_7_cast_fp16")];
            tensor<int32, [4]> var_574 = const()[name = tensor<string, []>("op_574"), val = tensor<int32, [4]>([1, 4096, 1, -1])];
            tensor<fp16, [1, 4096, 1, 77]> input_19_cast_fp16 = reshape(shape = var_574, x = attn_7_cast_fp16)[name = tensor<string, []>("input_19_cast_fp16")];
            tensor<int32, [2]> var_578 = const()[name = tensor<string, []>("op_578"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_580 = const()[name = tensor<string, []>("op_580"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> obj_17_pad_type_0 = const()[name = tensor<string, []>("obj_17_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> obj_17_pad_0 = const()[name = tensor<string, []>("obj_17_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_3_layer_0_SelfAttention_o_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_3_layer_0_SelfAttention_o_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(1522331008)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_17_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_580, groups = var_499, pad = obj_17_pad_0, pad_type = obj_17_pad_type_0, strides = var_578, weight = block_3_layer_0_SelfAttention_o_proj_weight_to_fp16, x = input_19_cast_fp16)[name = tensor<string, []>("obj_17_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_29_cast_fp16 = add(x = inputs_27_cast_fp16, y = obj_17_cast_fp16)[name = tensor<string, []>("inputs_29_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_31_cast_fp16 = clip(alpha = var_501_to_fp16, beta = var_500_to_fp16, x = inputs_29_cast_fp16)[name = tensor<string, []>("inputs_31_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_15_cast_fp16 = mul(x = inputs_31_cast_fp16, y = inputs_31_cast_fp16)[name = tensor<string, []>("inputs_sq_15_cast_fp16")];
            tensor<int32, [1]> var_589 = const()[name = tensor<string, []>("op_589"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_15_cast_fp16 = reduce_mean(axes = var_589, keep_dims = var_498, x = inputs_sq_15_cast_fp16)[name = tensor<string, []>("variance_15_cast_fp16")];
            tensor<fp16, []> var_591_to_fp16 = const()[name = tensor<string, []>("op_591_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_592_cast_fp16 = add(x = variance_15_cast_fp16, y = var_591_to_fp16)[name = tensor<string, []>("op_592_cast_fp16")];
            tensor<fp16, []> var_593_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_593_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_593_cast_fp16 = rsqrt(epsilon = var_593_epsilon_0_to_fp16, x = var_592_cast_fp16)[name = tensor<string, []>("op_593_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_15_cast_fp16 = mul(x = inputs_31_cast_fp16, y = var_593_cast_fp16)[name = tensor<string, []>("hidden_states_15_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_15_to_fp16 = const()[name = tensor<string, []>("w_15_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(1555885504)))];
            tensor<fp16, [1, 4096, 1, 77]> input_21_cast_fp16 = mul(x = w_15_to_fp16, y = hidden_states_15_cast_fp16)[name = tensor<string, []>("input_21_cast_fp16")];
            tensor<int32, [2]> var_606 = const()[name = tensor<string, []>("op_606"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_608 = const()[name = tensor<string, []>("op_608"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> x_9_pad_type_0 = const()[name = tensor<string, []>("x_9_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> x_9_pad_0 = const()[name = tensor<string, []>("x_9_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_3_layer_1_DenseReluDense_wi_0_weight_to_fp16 = const()[name = tensor<string, []>("block_3_layer_1_DenseReluDense_wi_0_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(1555893760)))];
            tensor<fp16, [1, 10240, 1, 77]> x_9_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_608, groups = var_499, pad = x_9_pad_0, pad_type = x_9_pad_type_0, strides = var_606, weight = block_3_layer_1_DenseReluDense_wi_0_weight_to_fp16, x = input_21_cast_fp16)[name = tensor<string, []>("x_9_cast_fp16")];
            tensor<string, []> var_622_mode_0 = const()[name = tensor<string, []>("op_622_mode_0"), val = tensor<string, []>("TANH_APPROXIMATION")];
            tensor<fp16, [1, 10240, 1, 77]> var_622_cast_fp16 = gelu(mode = var_622_mode_0, x = x_9_cast_fp16)[name = tensor<string, []>("op_622_cast_fp16")];
            tensor<int32, [2]> var_625 = const()[name = tensor<string, []>("op_625"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_627 = const()[name = tensor<string, []>("op_627"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_629_pad_type_0 = const()[name = tensor<string, []>("op_629_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_629_pad_0 = const()[name = tensor<string, []>("op_629_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_3_layer_1_DenseReluDense_wi_1_weight_to_fp16 = const()[name = tensor<string, []>("block_3_layer_1_DenseReluDense_wi_1_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(1639779904)))];
            tensor<fp16, [1, 10240, 1, 77]> var_629_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_627, groups = var_499, pad = var_629_pad_0, pad_type = var_629_pad_type_0, strides = var_625, weight = block_3_layer_1_DenseReluDense_wi_1_weight_to_fp16, x = input_21_cast_fp16)[name = tensor<string, []>("op_629_cast_fp16")];
            tensor<fp16, [1, 10240, 1, 77]> input_23_cast_fp16 = mul(x = var_622_cast_fp16, y = var_629_cast_fp16)[name = tensor<string, []>("input_23_cast_fp16")];
            tensor<int32, [2]> var_633 = const()[name = tensor<string, []>("op_633"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_635 = const()[name = tensor<string, []>("op_635"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_637_pad_type_0 = const()[name = tensor<string, []>("op_637_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_637_pad_0 = const()[name = tensor<string, []>("op_637_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 10240, 1, 1]> block_3_layer_1_DenseReluDense_wo_weight_to_fp16 = const()[name = tensor<string, []>("block_3_layer_1_DenseReluDense_wo_weight_to_fp16"), val = tensor<fp16, [4096, 10240, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(1723666048)))];
            tensor<fp16, [1, 4096, 1, 77]> var_637_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_635, groups = var_499, pad = var_637_pad_0, pad_type = var_637_pad_type_0, strides = var_633, weight = block_3_layer_1_DenseReluDense_wo_weight_to_fp16, x = input_23_cast_fp16)[name = tensor<string, []>("op_637_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_33_cast_fp16 = add(x = inputs_31_cast_fp16, y = var_637_cast_fp16)[name = tensor<string, []>("inputs_33_cast_fp16")];
            tensor<bool, []> var_642 = const()[name = tensor<string, []>("op_642"), val = tensor<bool, []>(true)];
            tensor<int32, []> var_643 = const()[name = tensor<string, []>("op_643"), val = tensor<int32, []>(1)];
            tensor<int32, []> var_647 = const()[name = tensor<string, []>("op_647"), val = tensor<int32, []>(3)];
            tensor<fp16, []> var_645_to_fp16 = const()[name = tensor<string, []>("op_645_to_fp16"), val = tensor<fp16, []>(-0x1.b18p+15)];
            tensor<fp16, []> var_644_to_fp16 = const()[name = tensor<string, []>("op_644_to_fp16"), val = tensor<fp16, []>(0x1.b18p+15)];
            tensor<fp16, [1, 4096, 1, 77]> inputs_35_cast_fp16 = clip(alpha = var_645_to_fp16, beta = var_644_to_fp16, x = inputs_33_cast_fp16)[name = tensor<string, []>("inputs_35_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_17_cast_fp16 = mul(x = inputs_35_cast_fp16, y = inputs_35_cast_fp16)[name = tensor<string, []>("inputs_sq_17_cast_fp16")];
            tensor<int32, [1]> var_664 = const()[name = tensor<string, []>("op_664"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_17_cast_fp16 = reduce_mean(axes = var_664, keep_dims = var_642, x = inputs_sq_17_cast_fp16)[name = tensor<string, []>("variance_17_cast_fp16")];
            tensor<fp16, []> var_666_to_fp16 = const()[name = tensor<string, []>("op_666_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_667_cast_fp16 = add(x = variance_17_cast_fp16, y = var_666_to_fp16)[name = tensor<string, []>("op_667_cast_fp16")];
            tensor<fp16, []> var_668_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_668_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_668_cast_fp16 = rsqrt(epsilon = var_668_epsilon_0_to_fp16, x = var_667_cast_fp16)[name = tensor<string, []>("op_668_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_17_cast_fp16 = mul(x = inputs_35_cast_fp16, y = var_668_cast_fp16)[name = tensor<string, []>("hidden_states_17_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_17_to_fp16 = const()[name = tensor<string, []>("w_17_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(1807552192)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_19_cast_fp16 = mul(x = w_17_to_fp16, y = hidden_states_17_cast_fp16)[name = tensor<string, []>("obj_19_cast_fp16")];
            tensor<int32, [2]> var_682 = const()[name = tensor<string, []>("op_682"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_684 = const()[name = tensor<string, []>("op_684"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> query_9_pad_type_0 = const()[name = tensor<string, []>("query_9_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> query_9_pad_0 = const()[name = tensor<string, []>("query_9_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_4_layer_0_SelfAttention_q_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_4_layer_0_SelfAttention_q_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(1807560448)))];
            tensor<fp16, [1, 4096, 1, 77]> query_9_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_684, groups = var_643, pad = query_9_pad_0, pad_type = query_9_pad_type_0, strides = var_682, weight = block_4_layer_0_SelfAttention_q_proj_weight_to_fp16, x = obj_19_cast_fp16)[name = tensor<string, []>("query_9_cast_fp16")];
            tensor<int32, [2]> var_688 = const()[name = tensor<string, []>("op_688"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_690 = const()[name = tensor<string, []>("op_690"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> key_9_pad_type_0 = const()[name = tensor<string, []>("key_9_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> key_9_pad_0 = const()[name = tensor<string, []>("key_9_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_4_layer_0_SelfAttention_k_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_4_layer_0_SelfAttention_k_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(1841114944)))];
            tensor<fp16, [1, 4096, 1, 77]> key_9_cast_fp16 = conv(dilations = var_690, groups = var_643, pad = key_9_pad_0, pad_type = key_9_pad_type_0, strides = var_688, weight = block_4_layer_0_SelfAttention_k_proj_weight_to_fp16, x = obj_19_cast_fp16)[name = tensor<string, []>("key_9_cast_fp16")];
            tensor<int32, [2]> var_695 = const()[name = tensor<string, []>("op_695"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_697 = const()[name = tensor<string, []>("op_697"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> value_9_pad_type_0 = const()[name = tensor<string, []>("value_9_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> value_9_pad_0 = const()[name = tensor<string, []>("value_9_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_4_layer_0_SelfAttention_v_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_4_layer_0_SelfAttention_v_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(1874669440)))];
            tensor<fp16, [1, 4096, 1, 77]> value_9_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_697, groups = var_643, pad = value_9_pad_0, pad_type = value_9_pad_type_0, strides = var_695, weight = block_4_layer_0_SelfAttention_v_proj_weight_to_fp16, x = obj_19_cast_fp16)[name = tensor<string, []>("value_9_cast_fp16")];
            tensor<int32, [4]> var_701 = const()[name = tensor<string, []>("op_701"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_702_cast_fp16 = reshape(shape = var_701, x = query_9_cast_fp16)[name = tensor<string, []>("op_702_cast_fp16")];
            tensor<int32, [4]> var_703 = const()[name = tensor<string, []>("op_703"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_704_cast_fp16 = reshape(shape = var_703, x = key_9_cast_fp16)[name = tensor<string, []>("op_704_cast_fp16")];
            tensor<bool, []> mh_w_25_transpose_x_0 = const()[name = tensor<string, []>("mh_w_25_transpose_x_0"), val = tensor<bool, []>(true)];
            tensor<bool, []> mh_w_25_transpose_y_0 = const()[name = tensor<string, []>("mh_w_25_transpose_y_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 77, 77]> mh_w_25_cast_fp16 = matmul(transpose_x = mh_w_25_transpose_x_0, transpose_y = mh_w_25_transpose_y_0, x = var_702_cast_fp16, y = var_704_cast_fp16)[name = tensor<string, []>("mh_w_25_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> mh_w_27_cast_fp16 = add(x = mh_w_25_cast_fp16, y = var_133_cast_fp16)[name = tensor<string, []>("mh_w_27_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> mh_w_29_cast_fp16 = add(x = mh_w_27_cast_fp16, y = relative_attention_bias_to_fp16)[name = tensor<string, []>("mh_w_29_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> var_713_cast_fp16 = softmax(axis = var_647, x = mh_w_29_cast_fp16)[name = tensor<string, []>("op_713_cast_fp16")];
            tensor<int32, [4]> var_714 = const()[name = tensor<string, []>("op_714"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_715_cast_fp16 = reshape(shape = var_714, x = value_9_cast_fp16)[name = tensor<string, []>("op_715_cast_fp16")];
            tensor<bool, []> attn_9_transpose_x_0 = const()[name = tensor<string, []>("attn_9_transpose_x_0"), val = tensor<bool, []>(false)];
            tensor<bool, []> attn_9_transpose_y_0 = const()[name = tensor<string, []>("attn_9_transpose_y_0"), val = tensor<bool, []>(true)];
            tensor<fp16, [1, 64, 64, 77]> attn_9_cast_fp16 = matmul(transpose_x = attn_9_transpose_x_0, transpose_y = attn_9_transpose_y_0, x = var_715_cast_fp16, y = var_713_cast_fp16)[name = tensor<string, []>("attn_9_cast_fp16")];
            tensor<int32, [4]> var_718 = const()[name = tensor<string, []>("op_718"), val = tensor<int32, [4]>([1, 4096, 1, -1])];
            tensor<fp16, [1, 4096, 1, 77]> input_25_cast_fp16 = reshape(shape = var_718, x = attn_9_cast_fp16)[name = tensor<string, []>("input_25_cast_fp16")];
            tensor<int32, [2]> var_722 = const()[name = tensor<string, []>("op_722"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_724 = const()[name = tensor<string, []>("op_724"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> obj_21_pad_type_0 = const()[name = tensor<string, []>("obj_21_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> obj_21_pad_0 = const()[name = tensor<string, []>("obj_21_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_4_layer_0_SelfAttention_o_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_4_layer_0_SelfAttention_o_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(1908223936)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_21_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_724, groups = var_643, pad = obj_21_pad_0, pad_type = obj_21_pad_type_0, strides = var_722, weight = block_4_layer_0_SelfAttention_o_proj_weight_to_fp16, x = input_25_cast_fp16)[name = tensor<string, []>("obj_21_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_37_cast_fp16 = add(x = inputs_35_cast_fp16, y = obj_21_cast_fp16)[name = tensor<string, []>("inputs_37_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_39_cast_fp16 = clip(alpha = var_645_to_fp16, beta = var_644_to_fp16, x = inputs_37_cast_fp16)[name = tensor<string, []>("inputs_39_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_19_cast_fp16 = mul(x = inputs_39_cast_fp16, y = inputs_39_cast_fp16)[name = tensor<string, []>("inputs_sq_19_cast_fp16")];
            tensor<int32, [1]> var_733 = const()[name = tensor<string, []>("op_733"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_19_cast_fp16 = reduce_mean(axes = var_733, keep_dims = var_642, x = inputs_sq_19_cast_fp16)[name = tensor<string, []>("variance_19_cast_fp16")];
            tensor<fp16, []> var_735_to_fp16 = const()[name = tensor<string, []>("op_735_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_736_cast_fp16 = add(x = variance_19_cast_fp16, y = var_735_to_fp16)[name = tensor<string, []>("op_736_cast_fp16")];
            tensor<fp16, []> var_737_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_737_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_737_cast_fp16 = rsqrt(epsilon = var_737_epsilon_0_to_fp16, x = var_736_cast_fp16)[name = tensor<string, []>("op_737_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_19_cast_fp16 = mul(x = inputs_39_cast_fp16, y = var_737_cast_fp16)[name = tensor<string, []>("hidden_states_19_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_19_to_fp16 = const()[name = tensor<string, []>("w_19_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(1941778432)))];
            tensor<fp16, [1, 4096, 1, 77]> input_27_cast_fp16 = mul(x = w_19_to_fp16, y = hidden_states_19_cast_fp16)[name = tensor<string, []>("input_27_cast_fp16")];
            tensor<int32, [2]> var_750 = const()[name = tensor<string, []>("op_750"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_752 = const()[name = tensor<string, []>("op_752"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> x_11_pad_type_0 = const()[name = tensor<string, []>("x_11_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> x_11_pad_0 = const()[name = tensor<string, []>("x_11_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_4_layer_1_DenseReluDense_wi_0_weight_to_fp16 = const()[name = tensor<string, []>("block_4_layer_1_DenseReluDense_wi_0_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(1941786688)))];
            tensor<fp16, [1, 10240, 1, 77]> x_11_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_752, groups = var_643, pad = x_11_pad_0, pad_type = x_11_pad_type_0, strides = var_750, weight = block_4_layer_1_DenseReluDense_wi_0_weight_to_fp16, x = input_27_cast_fp16)[name = tensor<string, []>("x_11_cast_fp16")];
            tensor<string, []> var_766_mode_0 = const()[name = tensor<string, []>("op_766_mode_0"), val = tensor<string, []>("TANH_APPROXIMATION")];
            tensor<fp16, [1, 10240, 1, 77]> var_766_cast_fp16 = gelu(mode = var_766_mode_0, x = x_11_cast_fp16)[name = tensor<string, []>("op_766_cast_fp16")];
            tensor<int32, [2]> var_769 = const()[name = tensor<string, []>("op_769"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_771 = const()[name = tensor<string, []>("op_771"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_773_pad_type_0 = const()[name = tensor<string, []>("op_773_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_773_pad_0 = const()[name = tensor<string, []>("op_773_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_4_layer_1_DenseReluDense_wi_1_weight_to_fp16 = const()[name = tensor<string, []>("block_4_layer_1_DenseReluDense_wi_1_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(2025672832)))];
            tensor<fp16, [1, 10240, 1, 77]> var_773_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_771, groups = var_643, pad = var_773_pad_0, pad_type = var_773_pad_type_0, strides = var_769, weight = block_4_layer_1_DenseReluDense_wi_1_weight_to_fp16, x = input_27_cast_fp16)[name = tensor<string, []>("op_773_cast_fp16")];
            tensor<fp16, [1, 10240, 1, 77]> input_29_cast_fp16 = mul(x = var_766_cast_fp16, y = var_773_cast_fp16)[name = tensor<string, []>("input_29_cast_fp16")];
            tensor<int32, [2]> var_777 = const()[name = tensor<string, []>("op_777"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_779 = const()[name = tensor<string, []>("op_779"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_781_pad_type_0 = const()[name = tensor<string, []>("op_781_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_781_pad_0 = const()[name = tensor<string, []>("op_781_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 10240, 1, 1]> block_4_layer_1_DenseReluDense_wo_weight_to_fp16 = const()[name = tensor<string, []>("block_4_layer_1_DenseReluDense_wo_weight_to_fp16"), val = tensor<fp16, [4096, 10240, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(2109558976)))];
            tensor<fp16, [1, 4096, 1, 77]> var_781_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_779, groups = var_643, pad = var_781_pad_0, pad_type = var_781_pad_type_0, strides = var_777, weight = block_4_layer_1_DenseReluDense_wo_weight_to_fp16, x = input_29_cast_fp16)[name = tensor<string, []>("op_781_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_41_cast_fp16 = add(x = inputs_39_cast_fp16, y = var_781_cast_fp16)[name = tensor<string, []>("inputs_41_cast_fp16")];
            tensor<bool, []> var_786 = const()[name = tensor<string, []>("op_786"), val = tensor<bool, []>(true)];
            tensor<int32, []> var_787 = const()[name = tensor<string, []>("op_787"), val = tensor<int32, []>(1)];
            tensor<int32, []> var_791 = const()[name = tensor<string, []>("op_791"), val = tensor<int32, []>(3)];
            tensor<fp16, []> var_789_to_fp16 = const()[name = tensor<string, []>("op_789_to_fp16"), val = tensor<fp16, []>(-0x1.b18p+15)];
            tensor<fp16, []> var_788_to_fp16 = const()[name = tensor<string, []>("op_788_to_fp16"), val = tensor<fp16, []>(0x1.b18p+15)];
            tensor<fp16, [1, 4096, 1, 77]> inputs_43_cast_fp16 = clip(alpha = var_789_to_fp16, beta = var_788_to_fp16, x = inputs_41_cast_fp16)[name = tensor<string, []>("inputs_43_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_21_cast_fp16 = mul(x = inputs_43_cast_fp16, y = inputs_43_cast_fp16)[name = tensor<string, []>("inputs_sq_21_cast_fp16")];
            tensor<int32, [1]> var_808 = const()[name = tensor<string, []>("op_808"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_21_cast_fp16 = reduce_mean(axes = var_808, keep_dims = var_786, x = inputs_sq_21_cast_fp16)[name = tensor<string, []>("variance_21_cast_fp16")];
            tensor<fp16, []> var_810_to_fp16 = const()[name = tensor<string, []>("op_810_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_811_cast_fp16 = add(x = variance_21_cast_fp16, y = var_810_to_fp16)[name = tensor<string, []>("op_811_cast_fp16")];
            tensor<fp16, []> var_812_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_812_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_812_cast_fp16 = rsqrt(epsilon = var_812_epsilon_0_to_fp16, x = var_811_cast_fp16)[name = tensor<string, []>("op_812_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_21_cast_fp16 = mul(x = inputs_43_cast_fp16, y = var_812_cast_fp16)[name = tensor<string, []>("hidden_states_21_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_21_to_fp16 = const()[name = tensor<string, []>("w_21_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(2193445120)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_23_cast_fp16 = mul(x = w_21_to_fp16, y = hidden_states_21_cast_fp16)[name = tensor<string, []>("obj_23_cast_fp16")];
            tensor<int32, [2]> var_826 = const()[name = tensor<string, []>("op_826"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_828 = const()[name = tensor<string, []>("op_828"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> query_11_pad_type_0 = const()[name = tensor<string, []>("query_11_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> query_11_pad_0 = const()[name = tensor<string, []>("query_11_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_5_layer_0_SelfAttention_q_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_5_layer_0_SelfAttention_q_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(2193453376)))];
            tensor<fp16, [1, 4096, 1, 77]> query_11_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_828, groups = var_787, pad = query_11_pad_0, pad_type = query_11_pad_type_0, strides = var_826, weight = block_5_layer_0_SelfAttention_q_proj_weight_to_fp16, x = obj_23_cast_fp16)[name = tensor<string, []>("query_11_cast_fp16")];
            tensor<int32, [2]> var_832 = const()[name = tensor<string, []>("op_832"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_834 = const()[name = tensor<string, []>("op_834"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> key_11_pad_type_0 = const()[name = tensor<string, []>("key_11_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> key_11_pad_0 = const()[name = tensor<string, []>("key_11_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_5_layer_0_SelfAttention_k_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_5_layer_0_SelfAttention_k_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(2227007872)))];
            tensor<fp16, [1, 4096, 1, 77]> key_11_cast_fp16 = conv(dilations = var_834, groups = var_787, pad = key_11_pad_0, pad_type = key_11_pad_type_0, strides = var_832, weight = block_5_layer_0_SelfAttention_k_proj_weight_to_fp16, x = obj_23_cast_fp16)[name = tensor<string, []>("key_11_cast_fp16")];
            tensor<int32, [2]> var_839 = const()[name = tensor<string, []>("op_839"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_841 = const()[name = tensor<string, []>("op_841"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> value_11_pad_type_0 = const()[name = tensor<string, []>("value_11_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> value_11_pad_0 = const()[name = tensor<string, []>("value_11_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_5_layer_0_SelfAttention_v_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_5_layer_0_SelfAttention_v_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(2260562368)))];
            tensor<fp16, [1, 4096, 1, 77]> value_11_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_841, groups = var_787, pad = value_11_pad_0, pad_type = value_11_pad_type_0, strides = var_839, weight = block_5_layer_0_SelfAttention_v_proj_weight_to_fp16, x = obj_23_cast_fp16)[name = tensor<string, []>("value_11_cast_fp16")];
            tensor<int32, [4]> var_845 = const()[name = tensor<string, []>("op_845"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_846_cast_fp16 = reshape(shape = var_845, x = query_11_cast_fp16)[name = tensor<string, []>("op_846_cast_fp16")];
            tensor<int32, [4]> var_847 = const()[name = tensor<string, []>("op_847"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_848_cast_fp16 = reshape(shape = var_847, x = key_11_cast_fp16)[name = tensor<string, []>("op_848_cast_fp16")];
            tensor<bool, []> mh_w_31_transpose_x_0 = const()[name = tensor<string, []>("mh_w_31_transpose_x_0"), val = tensor<bool, []>(true)];
            tensor<bool, []> mh_w_31_transpose_y_0 = const()[name = tensor<string, []>("mh_w_31_transpose_y_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 77, 77]> mh_w_31_cast_fp16 = matmul(transpose_x = mh_w_31_transpose_x_0, transpose_y = mh_w_31_transpose_y_0, x = var_846_cast_fp16, y = var_848_cast_fp16)[name = tensor<string, []>("mh_w_31_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> mh_w_33_cast_fp16 = add(x = mh_w_31_cast_fp16, y = var_133_cast_fp16)[name = tensor<string, []>("mh_w_33_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> mh_w_35_cast_fp16 = add(x = mh_w_33_cast_fp16, y = relative_attention_bias_to_fp16)[name = tensor<string, []>("mh_w_35_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> var_857_cast_fp16 = softmax(axis = var_791, x = mh_w_35_cast_fp16)[name = tensor<string, []>("op_857_cast_fp16")];
            tensor<int32, [4]> var_858 = const()[name = tensor<string, []>("op_858"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_859_cast_fp16 = reshape(shape = var_858, x = value_11_cast_fp16)[name = tensor<string, []>("op_859_cast_fp16")];
            tensor<bool, []> attn_11_transpose_x_0 = const()[name = tensor<string, []>("attn_11_transpose_x_0"), val = tensor<bool, []>(false)];
            tensor<bool, []> attn_11_transpose_y_0 = const()[name = tensor<string, []>("attn_11_transpose_y_0"), val = tensor<bool, []>(true)];
            tensor<fp16, [1, 64, 64, 77]> attn_11_cast_fp16 = matmul(transpose_x = attn_11_transpose_x_0, transpose_y = attn_11_transpose_y_0, x = var_859_cast_fp16, y = var_857_cast_fp16)[name = tensor<string, []>("attn_11_cast_fp16")];
            tensor<int32, [4]> var_862 = const()[name = tensor<string, []>("op_862"), val = tensor<int32, [4]>([1, 4096, 1, -1])];
            tensor<fp16, [1, 4096, 1, 77]> input_31_cast_fp16 = reshape(shape = var_862, x = attn_11_cast_fp16)[name = tensor<string, []>("input_31_cast_fp16")];
            tensor<int32, [2]> var_866 = const()[name = tensor<string, []>("op_866"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_868 = const()[name = tensor<string, []>("op_868"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> obj_25_pad_type_0 = const()[name = tensor<string, []>("obj_25_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> obj_25_pad_0 = const()[name = tensor<string, []>("obj_25_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_5_layer_0_SelfAttention_o_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_5_layer_0_SelfAttention_o_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(2294116864)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_25_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_868, groups = var_787, pad = obj_25_pad_0, pad_type = obj_25_pad_type_0, strides = var_866, weight = block_5_layer_0_SelfAttention_o_proj_weight_to_fp16, x = input_31_cast_fp16)[name = tensor<string, []>("obj_25_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_45_cast_fp16 = add(x = inputs_43_cast_fp16, y = obj_25_cast_fp16)[name = tensor<string, []>("inputs_45_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_47_cast_fp16 = clip(alpha = var_789_to_fp16, beta = var_788_to_fp16, x = inputs_45_cast_fp16)[name = tensor<string, []>("inputs_47_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_23_cast_fp16 = mul(x = inputs_47_cast_fp16, y = inputs_47_cast_fp16)[name = tensor<string, []>("inputs_sq_23_cast_fp16")];
            tensor<int32, [1]> var_877 = const()[name = tensor<string, []>("op_877"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_23_cast_fp16 = reduce_mean(axes = var_877, keep_dims = var_786, x = inputs_sq_23_cast_fp16)[name = tensor<string, []>("variance_23_cast_fp16")];
            tensor<fp16, []> var_879_to_fp16 = const()[name = tensor<string, []>("op_879_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_880_cast_fp16 = add(x = variance_23_cast_fp16, y = var_879_to_fp16)[name = tensor<string, []>("op_880_cast_fp16")];
            tensor<fp16, []> var_881_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_881_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_881_cast_fp16 = rsqrt(epsilon = var_881_epsilon_0_to_fp16, x = var_880_cast_fp16)[name = tensor<string, []>("op_881_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_23_cast_fp16 = mul(x = inputs_47_cast_fp16, y = var_881_cast_fp16)[name = tensor<string, []>("hidden_states_23_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_23_to_fp16 = const()[name = tensor<string, []>("w_23_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(2327671360)))];
            tensor<fp16, [1, 4096, 1, 77]> input_33_cast_fp16 = mul(x = w_23_to_fp16, y = hidden_states_23_cast_fp16)[name = tensor<string, []>("input_33_cast_fp16")];
            tensor<int32, [2]> var_894 = const()[name = tensor<string, []>("op_894"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_896 = const()[name = tensor<string, []>("op_896"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> x_13_pad_type_0 = const()[name = tensor<string, []>("x_13_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> x_13_pad_0 = const()[name = tensor<string, []>("x_13_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_5_layer_1_DenseReluDense_wi_0_weight_to_fp16 = const()[name = tensor<string, []>("block_5_layer_1_DenseReluDense_wi_0_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(2327679616)))];
            tensor<fp16, [1, 10240, 1, 77]> x_13_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_896, groups = var_787, pad = x_13_pad_0, pad_type = x_13_pad_type_0, strides = var_894, weight = block_5_layer_1_DenseReluDense_wi_0_weight_to_fp16, x = input_33_cast_fp16)[name = tensor<string, []>("x_13_cast_fp16")];
            tensor<string, []> var_910_mode_0 = const()[name = tensor<string, []>("op_910_mode_0"), val = tensor<string, []>("TANH_APPROXIMATION")];
            tensor<fp16, [1, 10240, 1, 77]> var_910_cast_fp16 = gelu(mode = var_910_mode_0, x = x_13_cast_fp16)[name = tensor<string, []>("op_910_cast_fp16")];
            tensor<int32, [2]> var_913 = const()[name = tensor<string, []>("op_913"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_915 = const()[name = tensor<string, []>("op_915"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_917_pad_type_0 = const()[name = tensor<string, []>("op_917_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_917_pad_0 = const()[name = tensor<string, []>("op_917_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_5_layer_1_DenseReluDense_wi_1_weight_to_fp16 = const()[name = tensor<string, []>("block_5_layer_1_DenseReluDense_wi_1_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(2411565760)))];
            tensor<fp16, [1, 10240, 1, 77]> var_917_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_915, groups = var_787, pad = var_917_pad_0, pad_type = var_917_pad_type_0, strides = var_913, weight = block_5_layer_1_DenseReluDense_wi_1_weight_to_fp16, x = input_33_cast_fp16)[name = tensor<string, []>("op_917_cast_fp16")];
            tensor<fp16, [1, 10240, 1, 77]> input_35_cast_fp16 = mul(x = var_910_cast_fp16, y = var_917_cast_fp16)[name = tensor<string, []>("input_35_cast_fp16")];
            tensor<int32, [2]> var_921 = const()[name = tensor<string, []>("op_921"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_923 = const()[name = tensor<string, []>("op_923"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_925_pad_type_0 = const()[name = tensor<string, []>("op_925_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_925_pad_0 = const()[name = tensor<string, []>("op_925_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 10240, 1, 1]> block_5_layer_1_DenseReluDense_wo_weight_to_fp16 = const()[name = tensor<string, []>("block_5_layer_1_DenseReluDense_wo_weight_to_fp16"), val = tensor<fp16, [4096, 10240, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(2495451904)))];
            tensor<fp16, [1, 4096, 1, 77]> var_925_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_923, groups = var_787, pad = var_925_pad_0, pad_type = var_925_pad_type_0, strides = var_921, weight = block_5_layer_1_DenseReluDense_wo_weight_to_fp16, x = input_35_cast_fp16)[name = tensor<string, []>("op_925_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_49_cast_fp16 = add(x = inputs_47_cast_fp16, y = var_925_cast_fp16)[name = tensor<string, []>("inputs_49_cast_fp16")];
            tensor<bool, []> var_930 = const()[name = tensor<string, []>("op_930"), val = tensor<bool, []>(true)];
            tensor<int32, []> var_931 = const()[name = tensor<string, []>("op_931"), val = tensor<int32, []>(1)];
            tensor<int32, []> var_935 = const()[name = tensor<string, []>("op_935"), val = tensor<int32, []>(3)];
            tensor<fp16, []> var_933_to_fp16 = const()[name = tensor<string, []>("op_933_to_fp16"), val = tensor<fp16, []>(-0x1.b18p+15)];
            tensor<fp16, []> var_932_to_fp16 = const()[name = tensor<string, []>("op_932_to_fp16"), val = tensor<fp16, []>(0x1.b18p+15)];
            tensor<fp16, [1, 4096, 1, 77]> inputs_51_cast_fp16 = clip(alpha = var_933_to_fp16, beta = var_932_to_fp16, x = inputs_49_cast_fp16)[name = tensor<string, []>("inputs_51_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_25_cast_fp16 = mul(x = inputs_51_cast_fp16, y = inputs_51_cast_fp16)[name = tensor<string, []>("inputs_sq_25_cast_fp16")];
            tensor<int32, [1]> var_952 = const()[name = tensor<string, []>("op_952"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_25_cast_fp16 = reduce_mean(axes = var_952, keep_dims = var_930, x = inputs_sq_25_cast_fp16)[name = tensor<string, []>("variance_25_cast_fp16")];
            tensor<fp16, []> var_954_to_fp16 = const()[name = tensor<string, []>("op_954_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_955_cast_fp16 = add(x = variance_25_cast_fp16, y = var_954_to_fp16)[name = tensor<string, []>("op_955_cast_fp16")];
            tensor<fp16, []> var_956_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_956_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_956_cast_fp16 = rsqrt(epsilon = var_956_epsilon_0_to_fp16, x = var_955_cast_fp16)[name = tensor<string, []>("op_956_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_25_cast_fp16 = mul(x = inputs_51_cast_fp16, y = var_956_cast_fp16)[name = tensor<string, []>("hidden_states_25_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_25_to_fp16 = const()[name = tensor<string, []>("w_25_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(2579338048)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_27_cast_fp16 = mul(x = w_25_to_fp16, y = hidden_states_25_cast_fp16)[name = tensor<string, []>("obj_27_cast_fp16")];
            tensor<int32, [2]> var_970 = const()[name = tensor<string, []>("op_970"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_972 = const()[name = tensor<string, []>("op_972"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> query_13_pad_type_0 = const()[name = tensor<string, []>("query_13_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> query_13_pad_0 = const()[name = tensor<string, []>("query_13_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_6_layer_0_SelfAttention_q_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_6_layer_0_SelfAttention_q_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(2579346304)))];
            tensor<fp16, [1, 4096, 1, 77]> query_13_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_972, groups = var_931, pad = query_13_pad_0, pad_type = query_13_pad_type_0, strides = var_970, weight = block_6_layer_0_SelfAttention_q_proj_weight_to_fp16, x = obj_27_cast_fp16)[name = tensor<string, []>("query_13_cast_fp16")];
            tensor<int32, [2]> var_976 = const()[name = tensor<string, []>("op_976"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_978 = const()[name = tensor<string, []>("op_978"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> key_13_pad_type_0 = const()[name = tensor<string, []>("key_13_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> key_13_pad_0 = const()[name = tensor<string, []>("key_13_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_6_layer_0_SelfAttention_k_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_6_layer_0_SelfAttention_k_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(2612900800)))];
            tensor<fp16, [1, 4096, 1, 77]> key_13_cast_fp16 = conv(dilations = var_978, groups = var_931, pad = key_13_pad_0, pad_type = key_13_pad_type_0, strides = var_976, weight = block_6_layer_0_SelfAttention_k_proj_weight_to_fp16, x = obj_27_cast_fp16)[name = tensor<string, []>("key_13_cast_fp16")];
            tensor<int32, [2]> var_983 = const()[name = tensor<string, []>("op_983"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_985 = const()[name = tensor<string, []>("op_985"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> value_13_pad_type_0 = const()[name = tensor<string, []>("value_13_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> value_13_pad_0 = const()[name = tensor<string, []>("value_13_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_6_layer_0_SelfAttention_v_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_6_layer_0_SelfAttention_v_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(2646455296)))];
            tensor<fp16, [1, 4096, 1, 77]> value_13_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_985, groups = var_931, pad = value_13_pad_0, pad_type = value_13_pad_type_0, strides = var_983, weight = block_6_layer_0_SelfAttention_v_proj_weight_to_fp16, x = obj_27_cast_fp16)[name = tensor<string, []>("value_13_cast_fp16")];
            tensor<int32, [4]> var_989 = const()[name = tensor<string, []>("op_989"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_990_cast_fp16 = reshape(shape = var_989, x = query_13_cast_fp16)[name = tensor<string, []>("op_990_cast_fp16")];
            tensor<int32, [4]> var_991 = const()[name = tensor<string, []>("op_991"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_992_cast_fp16 = reshape(shape = var_991, x = key_13_cast_fp16)[name = tensor<string, []>("op_992_cast_fp16")];
            tensor<bool, []> mh_w_37_transpose_x_0 = const()[name = tensor<string, []>("mh_w_37_transpose_x_0"), val = tensor<bool, []>(true)];
            tensor<bool, []> mh_w_37_transpose_y_0 = const()[name = tensor<string, []>("mh_w_37_transpose_y_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 77, 77]> mh_w_37_cast_fp16 = matmul(transpose_x = mh_w_37_transpose_x_0, transpose_y = mh_w_37_transpose_y_0, x = var_990_cast_fp16, y = var_992_cast_fp16)[name = tensor<string, []>("mh_w_37_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> mh_w_39_cast_fp16 = add(x = mh_w_37_cast_fp16, y = var_133_cast_fp16)[name = tensor<string, []>("mh_w_39_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> mh_w_41_cast_fp16 = add(x = mh_w_39_cast_fp16, y = relative_attention_bias_to_fp16)[name = tensor<string, []>("mh_w_41_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> var_1001_cast_fp16 = softmax(axis = var_935, x = mh_w_41_cast_fp16)[name = tensor<string, []>("op_1001_cast_fp16")];
            tensor<int32, [4]> var_1002 = const()[name = tensor<string, []>("op_1002"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_1003_cast_fp16 = reshape(shape = var_1002, x = value_13_cast_fp16)[name = tensor<string, []>("op_1003_cast_fp16")];
            tensor<bool, []> attn_13_transpose_x_0 = const()[name = tensor<string, []>("attn_13_transpose_x_0"), val = tensor<bool, []>(false)];
            tensor<bool, []> attn_13_transpose_y_0 = const()[name = tensor<string, []>("attn_13_transpose_y_0"), val = tensor<bool, []>(true)];
            tensor<fp16, [1, 64, 64, 77]> attn_13_cast_fp16 = matmul(transpose_x = attn_13_transpose_x_0, transpose_y = attn_13_transpose_y_0, x = var_1003_cast_fp16, y = var_1001_cast_fp16)[name = tensor<string, []>("attn_13_cast_fp16")];
            tensor<int32, [4]> var_1006 = const()[name = tensor<string, []>("op_1006"), val = tensor<int32, [4]>([1, 4096, 1, -1])];
            tensor<fp16, [1, 4096, 1, 77]> input_37_cast_fp16 = reshape(shape = var_1006, x = attn_13_cast_fp16)[name = tensor<string, []>("input_37_cast_fp16")];
            tensor<int32, [2]> var_1010 = const()[name = tensor<string, []>("op_1010"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1012 = const()[name = tensor<string, []>("op_1012"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> obj_29_pad_type_0 = const()[name = tensor<string, []>("obj_29_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> obj_29_pad_0 = const()[name = tensor<string, []>("obj_29_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_6_layer_0_SelfAttention_o_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_6_layer_0_SelfAttention_o_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(2680009792)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_29_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_1012, groups = var_931, pad = obj_29_pad_0, pad_type = obj_29_pad_type_0, strides = var_1010, weight = block_6_layer_0_SelfAttention_o_proj_weight_to_fp16, x = input_37_cast_fp16)[name = tensor<string, []>("obj_29_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_53_cast_fp16 = add(x = inputs_51_cast_fp16, y = obj_29_cast_fp16)[name = tensor<string, []>("inputs_53_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_55_cast_fp16 = clip(alpha = var_933_to_fp16, beta = var_932_to_fp16, x = inputs_53_cast_fp16)[name = tensor<string, []>("inputs_55_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_27_cast_fp16 = mul(x = inputs_55_cast_fp16, y = inputs_55_cast_fp16)[name = tensor<string, []>("inputs_sq_27_cast_fp16")];
            tensor<int32, [1]> var_1021 = const()[name = tensor<string, []>("op_1021"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_27_cast_fp16 = reduce_mean(axes = var_1021, keep_dims = var_930, x = inputs_sq_27_cast_fp16)[name = tensor<string, []>("variance_27_cast_fp16")];
            tensor<fp16, []> var_1023_to_fp16 = const()[name = tensor<string, []>("op_1023_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_1024_cast_fp16 = add(x = variance_27_cast_fp16, y = var_1023_to_fp16)[name = tensor<string, []>("op_1024_cast_fp16")];
            tensor<fp16, []> var_1025_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_1025_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_1025_cast_fp16 = rsqrt(epsilon = var_1025_epsilon_0_to_fp16, x = var_1024_cast_fp16)[name = tensor<string, []>("op_1025_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_27_cast_fp16 = mul(x = inputs_55_cast_fp16, y = var_1025_cast_fp16)[name = tensor<string, []>("hidden_states_27_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_27_to_fp16 = const()[name = tensor<string, []>("w_27_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(2713564288)))];
            tensor<fp16, [1, 4096, 1, 77]> input_39_cast_fp16 = mul(x = w_27_to_fp16, y = hidden_states_27_cast_fp16)[name = tensor<string, []>("input_39_cast_fp16")];
            tensor<int32, [2]> var_1038 = const()[name = tensor<string, []>("op_1038"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1040 = const()[name = tensor<string, []>("op_1040"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> x_15_pad_type_0 = const()[name = tensor<string, []>("x_15_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> x_15_pad_0 = const()[name = tensor<string, []>("x_15_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_6_layer_1_DenseReluDense_wi_0_weight_to_fp16 = const()[name = tensor<string, []>("block_6_layer_1_DenseReluDense_wi_0_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(2713572544)))];
            tensor<fp16, [1, 10240, 1, 77]> x_15_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_1040, groups = var_931, pad = x_15_pad_0, pad_type = x_15_pad_type_0, strides = var_1038, weight = block_6_layer_1_DenseReluDense_wi_0_weight_to_fp16, x = input_39_cast_fp16)[name = tensor<string, []>("x_15_cast_fp16")];
            tensor<string, []> var_1054_mode_0 = const()[name = tensor<string, []>("op_1054_mode_0"), val = tensor<string, []>("TANH_APPROXIMATION")];
            tensor<fp16, [1, 10240, 1, 77]> var_1054_cast_fp16 = gelu(mode = var_1054_mode_0, x = x_15_cast_fp16)[name = tensor<string, []>("op_1054_cast_fp16")];
            tensor<int32, [2]> var_1057 = const()[name = tensor<string, []>("op_1057"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1059 = const()[name = tensor<string, []>("op_1059"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_1061_pad_type_0 = const()[name = tensor<string, []>("op_1061_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_1061_pad_0 = const()[name = tensor<string, []>("op_1061_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_6_layer_1_DenseReluDense_wi_1_weight_to_fp16 = const()[name = tensor<string, []>("block_6_layer_1_DenseReluDense_wi_1_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(2797458688)))];
            tensor<fp16, [1, 10240, 1, 77]> var_1061_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_1059, groups = var_931, pad = var_1061_pad_0, pad_type = var_1061_pad_type_0, strides = var_1057, weight = block_6_layer_1_DenseReluDense_wi_1_weight_to_fp16, x = input_39_cast_fp16)[name = tensor<string, []>("op_1061_cast_fp16")];
            tensor<fp16, [1, 10240, 1, 77]> input_41_cast_fp16 = mul(x = var_1054_cast_fp16, y = var_1061_cast_fp16)[name = tensor<string, []>("input_41_cast_fp16")];
            tensor<int32, [2]> var_1065 = const()[name = tensor<string, []>("op_1065"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1067 = const()[name = tensor<string, []>("op_1067"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_1069_pad_type_0 = const()[name = tensor<string, []>("op_1069_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_1069_pad_0 = const()[name = tensor<string, []>("op_1069_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 10240, 1, 1]> block_6_layer_1_DenseReluDense_wo_weight_to_fp16 = const()[name = tensor<string, []>("block_6_layer_1_DenseReluDense_wo_weight_to_fp16"), val = tensor<fp16, [4096, 10240, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(2881344832)))];
            tensor<fp16, [1, 4096, 1, 77]> var_1069_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_1067, groups = var_931, pad = var_1069_pad_0, pad_type = var_1069_pad_type_0, strides = var_1065, weight = block_6_layer_1_DenseReluDense_wo_weight_to_fp16, x = input_41_cast_fp16)[name = tensor<string, []>("op_1069_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_57_cast_fp16 = add(x = inputs_55_cast_fp16, y = var_1069_cast_fp16)[name = tensor<string, []>("inputs_57_cast_fp16")];
            tensor<bool, []> var_1074 = const()[name = tensor<string, []>("op_1074"), val = tensor<bool, []>(true)];
            tensor<int32, []> var_1075 = const()[name = tensor<string, []>("op_1075"), val = tensor<int32, []>(1)];
            tensor<int32, []> var_1079 = const()[name = tensor<string, []>("op_1079"), val = tensor<int32, []>(3)];
            tensor<fp16, []> var_1077_to_fp16 = const()[name = tensor<string, []>("op_1077_to_fp16"), val = tensor<fp16, []>(-0x1.b18p+15)];
            tensor<fp16, []> var_1076_to_fp16 = const()[name = tensor<string, []>("op_1076_to_fp16"), val = tensor<fp16, []>(0x1.b18p+15)];
            tensor<fp16, [1, 4096, 1, 77]> inputs_59_cast_fp16 = clip(alpha = var_1077_to_fp16, beta = var_1076_to_fp16, x = inputs_57_cast_fp16)[name = tensor<string, []>("inputs_59_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_29_cast_fp16 = mul(x = inputs_59_cast_fp16, y = inputs_59_cast_fp16)[name = tensor<string, []>("inputs_sq_29_cast_fp16")];
            tensor<int32, [1]> var_1096 = const()[name = tensor<string, []>("op_1096"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_29_cast_fp16 = reduce_mean(axes = var_1096, keep_dims = var_1074, x = inputs_sq_29_cast_fp16)[name = tensor<string, []>("variance_29_cast_fp16")];
            tensor<fp16, []> var_1098_to_fp16 = const()[name = tensor<string, []>("op_1098_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_1099_cast_fp16 = add(x = variance_29_cast_fp16, y = var_1098_to_fp16)[name = tensor<string, []>("op_1099_cast_fp16")];
            tensor<fp16, []> var_1100_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_1100_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_1100_cast_fp16 = rsqrt(epsilon = var_1100_epsilon_0_to_fp16, x = var_1099_cast_fp16)[name = tensor<string, []>("op_1100_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_29_cast_fp16 = mul(x = inputs_59_cast_fp16, y = var_1100_cast_fp16)[name = tensor<string, []>("hidden_states_29_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_29_to_fp16 = const()[name = tensor<string, []>("w_29_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(2965230976)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_31_cast_fp16 = mul(x = w_29_to_fp16, y = hidden_states_29_cast_fp16)[name = tensor<string, []>("obj_31_cast_fp16")];
            tensor<int32, [2]> var_1114 = const()[name = tensor<string, []>("op_1114"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1116 = const()[name = tensor<string, []>("op_1116"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> query_15_pad_type_0 = const()[name = tensor<string, []>("query_15_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> query_15_pad_0 = const()[name = tensor<string, []>("query_15_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_7_layer_0_SelfAttention_q_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_7_layer_0_SelfAttention_q_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(2965239232)))];
            tensor<fp16, [1, 4096, 1, 77]> query_15_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_1116, groups = var_1075, pad = query_15_pad_0, pad_type = query_15_pad_type_0, strides = var_1114, weight = block_7_layer_0_SelfAttention_q_proj_weight_to_fp16, x = obj_31_cast_fp16)[name = tensor<string, []>("query_15_cast_fp16")];
            tensor<int32, [2]> var_1120 = const()[name = tensor<string, []>("op_1120"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1122 = const()[name = tensor<string, []>("op_1122"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> key_15_pad_type_0 = const()[name = tensor<string, []>("key_15_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> key_15_pad_0 = const()[name = tensor<string, []>("key_15_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_7_layer_0_SelfAttention_k_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_7_layer_0_SelfAttention_k_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(2998793728)))];
            tensor<fp16, [1, 4096, 1, 77]> key_15_cast_fp16 = conv(dilations = var_1122, groups = var_1075, pad = key_15_pad_0, pad_type = key_15_pad_type_0, strides = var_1120, weight = block_7_layer_0_SelfAttention_k_proj_weight_to_fp16, x = obj_31_cast_fp16)[name = tensor<string, []>("key_15_cast_fp16")];
            tensor<int32, [2]> var_1127 = const()[name = tensor<string, []>("op_1127"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1129 = const()[name = tensor<string, []>("op_1129"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> value_15_pad_type_0 = const()[name = tensor<string, []>("value_15_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> value_15_pad_0 = const()[name = tensor<string, []>("value_15_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_7_layer_0_SelfAttention_v_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_7_layer_0_SelfAttention_v_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(3032348224)))];
            tensor<fp16, [1, 4096, 1, 77]> value_15_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_1129, groups = var_1075, pad = value_15_pad_0, pad_type = value_15_pad_type_0, strides = var_1127, weight = block_7_layer_0_SelfAttention_v_proj_weight_to_fp16, x = obj_31_cast_fp16)[name = tensor<string, []>("value_15_cast_fp16")];
            tensor<int32, [4]> var_1133 = const()[name = tensor<string, []>("op_1133"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_1134_cast_fp16 = reshape(shape = var_1133, x = query_15_cast_fp16)[name = tensor<string, []>("op_1134_cast_fp16")];
            tensor<int32, [4]> var_1135 = const()[name = tensor<string, []>("op_1135"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_1136_cast_fp16 = reshape(shape = var_1135, x = key_15_cast_fp16)[name = tensor<string, []>("op_1136_cast_fp16")];
            tensor<bool, []> mh_w_43_transpose_x_0 = const()[name = tensor<string, []>("mh_w_43_transpose_x_0"), val = tensor<bool, []>(true)];
            tensor<bool, []> mh_w_43_transpose_y_0 = const()[name = tensor<string, []>("mh_w_43_transpose_y_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 77, 77]> mh_w_43_cast_fp16 = matmul(transpose_x = mh_w_43_transpose_x_0, transpose_y = mh_w_43_transpose_y_0, x = var_1134_cast_fp16, y = var_1136_cast_fp16)[name = tensor<string, []>("mh_w_43_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> mh_w_45_cast_fp16 = add(x = mh_w_43_cast_fp16, y = var_133_cast_fp16)[name = tensor<string, []>("mh_w_45_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> mh_w_47_cast_fp16 = add(x = mh_w_45_cast_fp16, y = relative_attention_bias_to_fp16)[name = tensor<string, []>("mh_w_47_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> var_1145_cast_fp16 = softmax(axis = var_1079, x = mh_w_47_cast_fp16)[name = tensor<string, []>("op_1145_cast_fp16")];
            tensor<int32, [4]> var_1146 = const()[name = tensor<string, []>("op_1146"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_1147_cast_fp16 = reshape(shape = var_1146, x = value_15_cast_fp16)[name = tensor<string, []>("op_1147_cast_fp16")];
            tensor<bool, []> attn_15_transpose_x_0 = const()[name = tensor<string, []>("attn_15_transpose_x_0"), val = tensor<bool, []>(false)];
            tensor<bool, []> attn_15_transpose_y_0 = const()[name = tensor<string, []>("attn_15_transpose_y_0"), val = tensor<bool, []>(true)];
            tensor<fp16, [1, 64, 64, 77]> attn_15_cast_fp16 = matmul(transpose_x = attn_15_transpose_x_0, transpose_y = attn_15_transpose_y_0, x = var_1147_cast_fp16, y = var_1145_cast_fp16)[name = tensor<string, []>("attn_15_cast_fp16")];
            tensor<int32, [4]> var_1150 = const()[name = tensor<string, []>("op_1150"), val = tensor<int32, [4]>([1, 4096, 1, -1])];
            tensor<fp16, [1, 4096, 1, 77]> input_43_cast_fp16 = reshape(shape = var_1150, x = attn_15_cast_fp16)[name = tensor<string, []>("input_43_cast_fp16")];
            tensor<int32, [2]> var_1154 = const()[name = tensor<string, []>("op_1154"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1156 = const()[name = tensor<string, []>("op_1156"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> obj_33_pad_type_0 = const()[name = tensor<string, []>("obj_33_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> obj_33_pad_0 = const()[name = tensor<string, []>("obj_33_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_7_layer_0_SelfAttention_o_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_7_layer_0_SelfAttention_o_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(3065902720)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_33_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_1156, groups = var_1075, pad = obj_33_pad_0, pad_type = obj_33_pad_type_0, strides = var_1154, weight = block_7_layer_0_SelfAttention_o_proj_weight_to_fp16, x = input_43_cast_fp16)[name = tensor<string, []>("obj_33_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_61_cast_fp16 = add(x = inputs_59_cast_fp16, y = obj_33_cast_fp16)[name = tensor<string, []>("inputs_61_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_63_cast_fp16 = clip(alpha = var_1077_to_fp16, beta = var_1076_to_fp16, x = inputs_61_cast_fp16)[name = tensor<string, []>("inputs_63_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_31_cast_fp16 = mul(x = inputs_63_cast_fp16, y = inputs_63_cast_fp16)[name = tensor<string, []>("inputs_sq_31_cast_fp16")];
            tensor<int32, [1]> var_1165 = const()[name = tensor<string, []>("op_1165"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_31_cast_fp16 = reduce_mean(axes = var_1165, keep_dims = var_1074, x = inputs_sq_31_cast_fp16)[name = tensor<string, []>("variance_31_cast_fp16")];
            tensor<fp16, []> var_1167_to_fp16 = const()[name = tensor<string, []>("op_1167_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_1168_cast_fp16 = add(x = variance_31_cast_fp16, y = var_1167_to_fp16)[name = tensor<string, []>("op_1168_cast_fp16")];
            tensor<fp16, []> var_1169_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_1169_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_1169_cast_fp16 = rsqrt(epsilon = var_1169_epsilon_0_to_fp16, x = var_1168_cast_fp16)[name = tensor<string, []>("op_1169_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_31_cast_fp16 = mul(x = inputs_63_cast_fp16, y = var_1169_cast_fp16)[name = tensor<string, []>("hidden_states_31_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_31_to_fp16 = const()[name = tensor<string, []>("w_31_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(3099457216)))];
            tensor<fp16, [1, 4096, 1, 77]> input_45_cast_fp16 = mul(x = w_31_to_fp16, y = hidden_states_31_cast_fp16)[name = tensor<string, []>("input_45_cast_fp16")];
            tensor<int32, [2]> var_1182 = const()[name = tensor<string, []>("op_1182"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1184 = const()[name = tensor<string, []>("op_1184"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> x_17_pad_type_0 = const()[name = tensor<string, []>("x_17_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> x_17_pad_0 = const()[name = tensor<string, []>("x_17_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_7_layer_1_DenseReluDense_wi_0_weight_to_fp16 = const()[name = tensor<string, []>("block_7_layer_1_DenseReluDense_wi_0_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(3099465472)))];
            tensor<fp16, [1, 10240, 1, 77]> x_17_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_1184, groups = var_1075, pad = x_17_pad_0, pad_type = x_17_pad_type_0, strides = var_1182, weight = block_7_layer_1_DenseReluDense_wi_0_weight_to_fp16, x = input_45_cast_fp16)[name = tensor<string, []>("x_17_cast_fp16")];
            tensor<string, []> var_1198_mode_0 = const()[name = tensor<string, []>("op_1198_mode_0"), val = tensor<string, []>("TANH_APPROXIMATION")];
            tensor<fp16, [1, 10240, 1, 77]> var_1198_cast_fp16 = gelu(mode = var_1198_mode_0, x = x_17_cast_fp16)[name = tensor<string, []>("op_1198_cast_fp16")];
            tensor<int32, [2]> var_1201 = const()[name = tensor<string, []>("op_1201"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1203 = const()[name = tensor<string, []>("op_1203"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_1205_pad_type_0 = const()[name = tensor<string, []>("op_1205_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_1205_pad_0 = const()[name = tensor<string, []>("op_1205_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_7_layer_1_DenseReluDense_wi_1_weight_to_fp16 = const()[name = tensor<string, []>("block_7_layer_1_DenseReluDense_wi_1_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(3183351616)))];
            tensor<fp16, [1, 10240, 1, 77]> var_1205_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_1203, groups = var_1075, pad = var_1205_pad_0, pad_type = var_1205_pad_type_0, strides = var_1201, weight = block_7_layer_1_DenseReluDense_wi_1_weight_to_fp16, x = input_45_cast_fp16)[name = tensor<string, []>("op_1205_cast_fp16")];
            tensor<fp16, [1, 10240, 1, 77]> input_47_cast_fp16 = mul(x = var_1198_cast_fp16, y = var_1205_cast_fp16)[name = tensor<string, []>("input_47_cast_fp16")];
            tensor<int32, [2]> var_1209 = const()[name = tensor<string, []>("op_1209"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1211 = const()[name = tensor<string, []>("op_1211"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_1213_pad_type_0 = const()[name = tensor<string, []>("op_1213_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_1213_pad_0 = const()[name = tensor<string, []>("op_1213_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 10240, 1, 1]> block_7_layer_1_DenseReluDense_wo_weight_to_fp16 = const()[name = tensor<string, []>("block_7_layer_1_DenseReluDense_wo_weight_to_fp16"), val = tensor<fp16, [4096, 10240, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(3267237760)))];
            tensor<fp16, [1, 4096, 1, 77]> var_1213_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_1211, groups = var_1075, pad = var_1213_pad_0, pad_type = var_1213_pad_type_0, strides = var_1209, weight = block_7_layer_1_DenseReluDense_wo_weight_to_fp16, x = input_47_cast_fp16)[name = tensor<string, []>("op_1213_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_65_cast_fp16 = add(x = inputs_63_cast_fp16, y = var_1213_cast_fp16)[name = tensor<string, []>("inputs_65_cast_fp16")];
            tensor<bool, []> var_1218 = const()[name = tensor<string, []>("op_1218"), val = tensor<bool, []>(true)];
            tensor<int32, []> var_1219 = const()[name = tensor<string, []>("op_1219"), val = tensor<int32, []>(1)];
            tensor<int32, []> var_1223 = const()[name = tensor<string, []>("op_1223"), val = tensor<int32, []>(3)];
            tensor<fp16, []> var_1221_to_fp16 = const()[name = tensor<string, []>("op_1221_to_fp16"), val = tensor<fp16, []>(-0x1.b18p+15)];
            tensor<fp16, []> var_1220_to_fp16 = const()[name = tensor<string, []>("op_1220_to_fp16"), val = tensor<fp16, []>(0x1.b18p+15)];
            tensor<fp16, [1, 4096, 1, 77]> inputs_67_cast_fp16 = clip(alpha = var_1221_to_fp16, beta = var_1220_to_fp16, x = inputs_65_cast_fp16)[name = tensor<string, []>("inputs_67_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_33_cast_fp16 = mul(x = inputs_67_cast_fp16, y = inputs_67_cast_fp16)[name = tensor<string, []>("inputs_sq_33_cast_fp16")];
            tensor<int32, [1]> var_1240 = const()[name = tensor<string, []>("op_1240"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_33_cast_fp16 = reduce_mean(axes = var_1240, keep_dims = var_1218, x = inputs_sq_33_cast_fp16)[name = tensor<string, []>("variance_33_cast_fp16")];
            tensor<fp16, []> var_1242_to_fp16 = const()[name = tensor<string, []>("op_1242_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_1243_cast_fp16 = add(x = variance_33_cast_fp16, y = var_1242_to_fp16)[name = tensor<string, []>("op_1243_cast_fp16")];
            tensor<fp16, []> var_1244_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_1244_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_1244_cast_fp16 = rsqrt(epsilon = var_1244_epsilon_0_to_fp16, x = var_1243_cast_fp16)[name = tensor<string, []>("op_1244_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_33_cast_fp16 = mul(x = inputs_67_cast_fp16, y = var_1244_cast_fp16)[name = tensor<string, []>("hidden_states_33_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_33_to_fp16 = const()[name = tensor<string, []>("w_33_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(3351123904)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_35_cast_fp16 = mul(x = w_33_to_fp16, y = hidden_states_33_cast_fp16)[name = tensor<string, []>("obj_35_cast_fp16")];
            tensor<int32, [2]> var_1258 = const()[name = tensor<string, []>("op_1258"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1260 = const()[name = tensor<string, []>("op_1260"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> query_17_pad_type_0 = const()[name = tensor<string, []>("query_17_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> query_17_pad_0 = const()[name = tensor<string, []>("query_17_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_8_layer_0_SelfAttention_q_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_8_layer_0_SelfAttention_q_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(3351132160)))];
            tensor<fp16, [1, 4096, 1, 77]> query_17_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_1260, groups = var_1219, pad = query_17_pad_0, pad_type = query_17_pad_type_0, strides = var_1258, weight = block_8_layer_0_SelfAttention_q_proj_weight_to_fp16, x = obj_35_cast_fp16)[name = tensor<string, []>("query_17_cast_fp16")];
            tensor<int32, [2]> var_1264 = const()[name = tensor<string, []>("op_1264"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1266 = const()[name = tensor<string, []>("op_1266"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> key_17_pad_type_0 = const()[name = tensor<string, []>("key_17_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> key_17_pad_0 = const()[name = tensor<string, []>("key_17_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_8_layer_0_SelfAttention_k_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_8_layer_0_SelfAttention_k_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(3384686656)))];
            tensor<fp16, [1, 4096, 1, 77]> key_17_cast_fp16 = conv(dilations = var_1266, groups = var_1219, pad = key_17_pad_0, pad_type = key_17_pad_type_0, strides = var_1264, weight = block_8_layer_0_SelfAttention_k_proj_weight_to_fp16, x = obj_35_cast_fp16)[name = tensor<string, []>("key_17_cast_fp16")];
            tensor<int32, [2]> var_1271 = const()[name = tensor<string, []>("op_1271"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1273 = const()[name = tensor<string, []>("op_1273"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> value_17_pad_type_0 = const()[name = tensor<string, []>("value_17_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> value_17_pad_0 = const()[name = tensor<string, []>("value_17_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_8_layer_0_SelfAttention_v_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_8_layer_0_SelfAttention_v_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(3418241152)))];
            tensor<fp16, [1, 4096, 1, 77]> value_17_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_1273, groups = var_1219, pad = value_17_pad_0, pad_type = value_17_pad_type_0, strides = var_1271, weight = block_8_layer_0_SelfAttention_v_proj_weight_to_fp16, x = obj_35_cast_fp16)[name = tensor<string, []>("value_17_cast_fp16")];
            tensor<int32, [4]> var_1277 = const()[name = tensor<string, []>("op_1277"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_1278_cast_fp16 = reshape(shape = var_1277, x = query_17_cast_fp16)[name = tensor<string, []>("op_1278_cast_fp16")];
            tensor<int32, [4]> var_1279 = const()[name = tensor<string, []>("op_1279"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_1280_cast_fp16 = reshape(shape = var_1279, x = key_17_cast_fp16)[name = tensor<string, []>("op_1280_cast_fp16")];
            tensor<bool, []> mh_w_49_transpose_x_0 = const()[name = tensor<string, []>("mh_w_49_transpose_x_0"), val = tensor<bool, []>(true)];
            tensor<bool, []> mh_w_49_transpose_y_0 = const()[name = tensor<string, []>("mh_w_49_transpose_y_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 77, 77]> mh_w_49_cast_fp16 = matmul(transpose_x = mh_w_49_transpose_x_0, transpose_y = mh_w_49_transpose_y_0, x = var_1278_cast_fp16, y = var_1280_cast_fp16)[name = tensor<string, []>("mh_w_49_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> mh_w_51_cast_fp16 = add(x = mh_w_49_cast_fp16, y = var_133_cast_fp16)[name = tensor<string, []>("mh_w_51_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> mh_w_53_cast_fp16 = add(x = mh_w_51_cast_fp16, y = relative_attention_bias_to_fp16)[name = tensor<string, []>("mh_w_53_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> var_1289_cast_fp16 = softmax(axis = var_1223, x = mh_w_53_cast_fp16)[name = tensor<string, []>("op_1289_cast_fp16")];
            tensor<int32, [4]> var_1290 = const()[name = tensor<string, []>("op_1290"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_1291_cast_fp16 = reshape(shape = var_1290, x = value_17_cast_fp16)[name = tensor<string, []>("op_1291_cast_fp16")];
            tensor<bool, []> attn_17_transpose_x_0 = const()[name = tensor<string, []>("attn_17_transpose_x_0"), val = tensor<bool, []>(false)];
            tensor<bool, []> attn_17_transpose_y_0 = const()[name = tensor<string, []>("attn_17_transpose_y_0"), val = tensor<bool, []>(true)];
            tensor<fp16, [1, 64, 64, 77]> attn_17_cast_fp16 = matmul(transpose_x = attn_17_transpose_x_0, transpose_y = attn_17_transpose_y_0, x = var_1291_cast_fp16, y = var_1289_cast_fp16)[name = tensor<string, []>("attn_17_cast_fp16")];
            tensor<int32, [4]> var_1294 = const()[name = tensor<string, []>("op_1294"), val = tensor<int32, [4]>([1, 4096, 1, -1])];
            tensor<fp16, [1, 4096, 1, 77]> input_49_cast_fp16 = reshape(shape = var_1294, x = attn_17_cast_fp16)[name = tensor<string, []>("input_49_cast_fp16")];
            tensor<int32, [2]> var_1298 = const()[name = tensor<string, []>("op_1298"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1300 = const()[name = tensor<string, []>("op_1300"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> obj_37_pad_type_0 = const()[name = tensor<string, []>("obj_37_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> obj_37_pad_0 = const()[name = tensor<string, []>("obj_37_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_8_layer_0_SelfAttention_o_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_8_layer_0_SelfAttention_o_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(3451795648)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_37_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_1300, groups = var_1219, pad = obj_37_pad_0, pad_type = obj_37_pad_type_0, strides = var_1298, weight = block_8_layer_0_SelfAttention_o_proj_weight_to_fp16, x = input_49_cast_fp16)[name = tensor<string, []>("obj_37_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_69_cast_fp16 = add(x = inputs_67_cast_fp16, y = obj_37_cast_fp16)[name = tensor<string, []>("inputs_69_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_71_cast_fp16 = clip(alpha = var_1221_to_fp16, beta = var_1220_to_fp16, x = inputs_69_cast_fp16)[name = tensor<string, []>("inputs_71_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_35_cast_fp16 = mul(x = inputs_71_cast_fp16, y = inputs_71_cast_fp16)[name = tensor<string, []>("inputs_sq_35_cast_fp16")];
            tensor<int32, [1]> var_1309 = const()[name = tensor<string, []>("op_1309"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_35_cast_fp16 = reduce_mean(axes = var_1309, keep_dims = var_1218, x = inputs_sq_35_cast_fp16)[name = tensor<string, []>("variance_35_cast_fp16")];
            tensor<fp16, []> var_1311_to_fp16 = const()[name = tensor<string, []>("op_1311_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_1312_cast_fp16 = add(x = variance_35_cast_fp16, y = var_1311_to_fp16)[name = tensor<string, []>("op_1312_cast_fp16")];
            tensor<fp16, []> var_1313_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_1313_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_1313_cast_fp16 = rsqrt(epsilon = var_1313_epsilon_0_to_fp16, x = var_1312_cast_fp16)[name = tensor<string, []>("op_1313_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_35_cast_fp16 = mul(x = inputs_71_cast_fp16, y = var_1313_cast_fp16)[name = tensor<string, []>("hidden_states_35_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_35_to_fp16 = const()[name = tensor<string, []>("w_35_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(3485350144)))];
            tensor<fp16, [1, 4096, 1, 77]> input_51_cast_fp16 = mul(x = w_35_to_fp16, y = hidden_states_35_cast_fp16)[name = tensor<string, []>("input_51_cast_fp16")];
            tensor<int32, [2]> var_1326 = const()[name = tensor<string, []>("op_1326"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1328 = const()[name = tensor<string, []>("op_1328"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> x_19_pad_type_0 = const()[name = tensor<string, []>("x_19_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> x_19_pad_0 = const()[name = tensor<string, []>("x_19_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_8_layer_1_DenseReluDense_wi_0_weight_to_fp16 = const()[name = tensor<string, []>("block_8_layer_1_DenseReluDense_wi_0_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(3485358400)))];
            tensor<fp16, [1, 10240, 1, 77]> x_19_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_1328, groups = var_1219, pad = x_19_pad_0, pad_type = x_19_pad_type_0, strides = var_1326, weight = block_8_layer_1_DenseReluDense_wi_0_weight_to_fp16, x = input_51_cast_fp16)[name = tensor<string, []>("x_19_cast_fp16")];
            tensor<string, []> var_1342_mode_0 = const()[name = tensor<string, []>("op_1342_mode_0"), val = tensor<string, []>("TANH_APPROXIMATION")];
            tensor<fp16, [1, 10240, 1, 77]> var_1342_cast_fp16 = gelu(mode = var_1342_mode_0, x = x_19_cast_fp16)[name = tensor<string, []>("op_1342_cast_fp16")];
            tensor<int32, [2]> var_1345 = const()[name = tensor<string, []>("op_1345"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1347 = const()[name = tensor<string, []>("op_1347"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_1349_pad_type_0 = const()[name = tensor<string, []>("op_1349_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_1349_pad_0 = const()[name = tensor<string, []>("op_1349_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_8_layer_1_DenseReluDense_wi_1_weight_to_fp16 = const()[name = tensor<string, []>("block_8_layer_1_DenseReluDense_wi_1_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(3569244544)))];
            tensor<fp16, [1, 10240, 1, 77]> var_1349_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_1347, groups = var_1219, pad = var_1349_pad_0, pad_type = var_1349_pad_type_0, strides = var_1345, weight = block_8_layer_1_DenseReluDense_wi_1_weight_to_fp16, x = input_51_cast_fp16)[name = tensor<string, []>("op_1349_cast_fp16")];
            tensor<fp16, [1, 10240, 1, 77]> input_53_cast_fp16 = mul(x = var_1342_cast_fp16, y = var_1349_cast_fp16)[name = tensor<string, []>("input_53_cast_fp16")];
            tensor<int32, [2]> var_1353 = const()[name = tensor<string, []>("op_1353"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1355 = const()[name = tensor<string, []>("op_1355"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_1357_pad_type_0 = const()[name = tensor<string, []>("op_1357_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_1357_pad_0 = const()[name = tensor<string, []>("op_1357_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 10240, 1, 1]> block_8_layer_1_DenseReluDense_wo_weight_to_fp16 = const()[name = tensor<string, []>("block_8_layer_1_DenseReluDense_wo_weight_to_fp16"), val = tensor<fp16, [4096, 10240, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(3653130688)))];
            tensor<fp16, [1, 4096, 1, 77]> var_1357_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_1355, groups = var_1219, pad = var_1357_pad_0, pad_type = var_1357_pad_type_0, strides = var_1353, weight = block_8_layer_1_DenseReluDense_wo_weight_to_fp16, x = input_53_cast_fp16)[name = tensor<string, []>("op_1357_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_73_cast_fp16 = add(x = inputs_71_cast_fp16, y = var_1357_cast_fp16)[name = tensor<string, []>("inputs_73_cast_fp16")];
            tensor<bool, []> var_1362 = const()[name = tensor<string, []>("op_1362"), val = tensor<bool, []>(true)];
            tensor<int32, []> var_1363 = const()[name = tensor<string, []>("op_1363"), val = tensor<int32, []>(1)];
            tensor<int32, []> var_1367 = const()[name = tensor<string, []>("op_1367"), val = tensor<int32, []>(3)];
            tensor<fp16, []> var_1365_to_fp16 = const()[name = tensor<string, []>("op_1365_to_fp16"), val = tensor<fp16, []>(-0x1.b18p+15)];
            tensor<fp16, []> var_1364_to_fp16 = const()[name = tensor<string, []>("op_1364_to_fp16"), val = tensor<fp16, []>(0x1.b18p+15)];
            tensor<fp16, [1, 4096, 1, 77]> inputs_75_cast_fp16 = clip(alpha = var_1365_to_fp16, beta = var_1364_to_fp16, x = inputs_73_cast_fp16)[name = tensor<string, []>("inputs_75_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_37_cast_fp16 = mul(x = inputs_75_cast_fp16, y = inputs_75_cast_fp16)[name = tensor<string, []>("inputs_sq_37_cast_fp16")];
            tensor<int32, [1]> var_1384 = const()[name = tensor<string, []>("op_1384"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_37_cast_fp16 = reduce_mean(axes = var_1384, keep_dims = var_1362, x = inputs_sq_37_cast_fp16)[name = tensor<string, []>("variance_37_cast_fp16")];
            tensor<fp16, []> var_1386_to_fp16 = const()[name = tensor<string, []>("op_1386_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_1387_cast_fp16 = add(x = variance_37_cast_fp16, y = var_1386_to_fp16)[name = tensor<string, []>("op_1387_cast_fp16")];
            tensor<fp16, []> var_1388_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_1388_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_1388_cast_fp16 = rsqrt(epsilon = var_1388_epsilon_0_to_fp16, x = var_1387_cast_fp16)[name = tensor<string, []>("op_1388_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_37_cast_fp16 = mul(x = inputs_75_cast_fp16, y = var_1388_cast_fp16)[name = tensor<string, []>("hidden_states_37_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_37_to_fp16 = const()[name = tensor<string, []>("w_37_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(3737016832)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_39_cast_fp16 = mul(x = w_37_to_fp16, y = hidden_states_37_cast_fp16)[name = tensor<string, []>("obj_39_cast_fp16")];
            tensor<int32, [2]> var_1402 = const()[name = tensor<string, []>("op_1402"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1404 = const()[name = tensor<string, []>("op_1404"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> query_19_pad_type_0 = const()[name = tensor<string, []>("query_19_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> query_19_pad_0 = const()[name = tensor<string, []>("query_19_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_9_layer_0_SelfAttention_q_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_9_layer_0_SelfAttention_q_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(3737025088)))];
            tensor<fp16, [1, 4096, 1, 77]> query_19_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_1404, groups = var_1363, pad = query_19_pad_0, pad_type = query_19_pad_type_0, strides = var_1402, weight = block_9_layer_0_SelfAttention_q_proj_weight_to_fp16, x = obj_39_cast_fp16)[name = tensor<string, []>("query_19_cast_fp16")];
            tensor<int32, [2]> var_1408 = const()[name = tensor<string, []>("op_1408"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1410 = const()[name = tensor<string, []>("op_1410"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> key_19_pad_type_0 = const()[name = tensor<string, []>("key_19_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> key_19_pad_0 = const()[name = tensor<string, []>("key_19_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_9_layer_0_SelfAttention_k_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_9_layer_0_SelfAttention_k_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(3770579584)))];
            tensor<fp16, [1, 4096, 1, 77]> key_19_cast_fp16 = conv(dilations = var_1410, groups = var_1363, pad = key_19_pad_0, pad_type = key_19_pad_type_0, strides = var_1408, weight = block_9_layer_0_SelfAttention_k_proj_weight_to_fp16, x = obj_39_cast_fp16)[name = tensor<string, []>("key_19_cast_fp16")];
            tensor<int32, [2]> var_1415 = const()[name = tensor<string, []>("op_1415"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1417 = const()[name = tensor<string, []>("op_1417"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> value_19_pad_type_0 = const()[name = tensor<string, []>("value_19_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> value_19_pad_0 = const()[name = tensor<string, []>("value_19_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_9_layer_0_SelfAttention_v_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_9_layer_0_SelfAttention_v_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(3804134080)))];
            tensor<fp16, [1, 4096, 1, 77]> value_19_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_1417, groups = var_1363, pad = value_19_pad_0, pad_type = value_19_pad_type_0, strides = var_1415, weight = block_9_layer_0_SelfAttention_v_proj_weight_to_fp16, x = obj_39_cast_fp16)[name = tensor<string, []>("value_19_cast_fp16")];
            tensor<int32, [4]> var_1421 = const()[name = tensor<string, []>("op_1421"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_1422_cast_fp16 = reshape(shape = var_1421, x = query_19_cast_fp16)[name = tensor<string, []>("op_1422_cast_fp16")];
            tensor<int32, [4]> var_1423 = const()[name = tensor<string, []>("op_1423"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_1424_cast_fp16 = reshape(shape = var_1423, x = key_19_cast_fp16)[name = tensor<string, []>("op_1424_cast_fp16")];
            tensor<bool, []> mh_w_55_transpose_x_0 = const()[name = tensor<string, []>("mh_w_55_transpose_x_0"), val = tensor<bool, []>(true)];
            tensor<bool, []> mh_w_55_transpose_y_0 = const()[name = tensor<string, []>("mh_w_55_transpose_y_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 77, 77]> mh_w_55_cast_fp16 = matmul(transpose_x = mh_w_55_transpose_x_0, transpose_y = mh_w_55_transpose_y_0, x = var_1422_cast_fp16, y = var_1424_cast_fp16)[name = tensor<string, []>("mh_w_55_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> mh_w_57_cast_fp16 = add(x = mh_w_55_cast_fp16, y = var_133_cast_fp16)[name = tensor<string, []>("mh_w_57_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> mh_w_59_cast_fp16 = add(x = mh_w_57_cast_fp16, y = relative_attention_bias_to_fp16)[name = tensor<string, []>("mh_w_59_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> var_1433_cast_fp16 = softmax(axis = var_1367, x = mh_w_59_cast_fp16)[name = tensor<string, []>("op_1433_cast_fp16")];
            tensor<int32, [4]> var_1434 = const()[name = tensor<string, []>("op_1434"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_1435_cast_fp16 = reshape(shape = var_1434, x = value_19_cast_fp16)[name = tensor<string, []>("op_1435_cast_fp16")];
            tensor<bool, []> attn_19_transpose_x_0 = const()[name = tensor<string, []>("attn_19_transpose_x_0"), val = tensor<bool, []>(false)];
            tensor<bool, []> attn_19_transpose_y_0 = const()[name = tensor<string, []>("attn_19_transpose_y_0"), val = tensor<bool, []>(true)];
            tensor<fp16, [1, 64, 64, 77]> attn_19_cast_fp16 = matmul(transpose_x = attn_19_transpose_x_0, transpose_y = attn_19_transpose_y_0, x = var_1435_cast_fp16, y = var_1433_cast_fp16)[name = tensor<string, []>("attn_19_cast_fp16")];
            tensor<int32, [4]> var_1438 = const()[name = tensor<string, []>("op_1438"), val = tensor<int32, [4]>([1, 4096, 1, -1])];
            tensor<fp16, [1, 4096, 1, 77]> input_55_cast_fp16 = reshape(shape = var_1438, x = attn_19_cast_fp16)[name = tensor<string, []>("input_55_cast_fp16")];
            tensor<int32, [2]> var_1442 = const()[name = tensor<string, []>("op_1442"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1444 = const()[name = tensor<string, []>("op_1444"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> obj_41_pad_type_0 = const()[name = tensor<string, []>("obj_41_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> obj_41_pad_0 = const()[name = tensor<string, []>("obj_41_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_9_layer_0_SelfAttention_o_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_9_layer_0_SelfAttention_o_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(3837688576)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_41_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_1444, groups = var_1363, pad = obj_41_pad_0, pad_type = obj_41_pad_type_0, strides = var_1442, weight = block_9_layer_0_SelfAttention_o_proj_weight_to_fp16, x = input_55_cast_fp16)[name = tensor<string, []>("obj_41_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_77_cast_fp16 = add(x = inputs_75_cast_fp16, y = obj_41_cast_fp16)[name = tensor<string, []>("inputs_77_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_79_cast_fp16 = clip(alpha = var_1365_to_fp16, beta = var_1364_to_fp16, x = inputs_77_cast_fp16)[name = tensor<string, []>("inputs_79_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_39_cast_fp16 = mul(x = inputs_79_cast_fp16, y = inputs_79_cast_fp16)[name = tensor<string, []>("inputs_sq_39_cast_fp16")];
            tensor<int32, [1]> var_1453 = const()[name = tensor<string, []>("op_1453"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_39_cast_fp16 = reduce_mean(axes = var_1453, keep_dims = var_1362, x = inputs_sq_39_cast_fp16)[name = tensor<string, []>("variance_39_cast_fp16")];
            tensor<fp16, []> var_1455_to_fp16 = const()[name = tensor<string, []>("op_1455_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_1456_cast_fp16 = add(x = variance_39_cast_fp16, y = var_1455_to_fp16)[name = tensor<string, []>("op_1456_cast_fp16")];
            tensor<fp16, []> var_1457_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_1457_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_1457_cast_fp16 = rsqrt(epsilon = var_1457_epsilon_0_to_fp16, x = var_1456_cast_fp16)[name = tensor<string, []>("op_1457_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_39_cast_fp16 = mul(x = inputs_79_cast_fp16, y = var_1457_cast_fp16)[name = tensor<string, []>("hidden_states_39_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_39_to_fp16 = const()[name = tensor<string, []>("w_39_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(3871243072)))];
            tensor<fp16, [1, 4096, 1, 77]> input_57_cast_fp16 = mul(x = w_39_to_fp16, y = hidden_states_39_cast_fp16)[name = tensor<string, []>("input_57_cast_fp16")];
            tensor<int32, [2]> var_1470 = const()[name = tensor<string, []>("op_1470"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1472 = const()[name = tensor<string, []>("op_1472"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> x_21_pad_type_0 = const()[name = tensor<string, []>("x_21_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> x_21_pad_0 = const()[name = tensor<string, []>("x_21_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_9_layer_1_DenseReluDense_wi_0_weight_to_fp16 = const()[name = tensor<string, []>("block_9_layer_1_DenseReluDense_wi_0_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(3871251328)))];
            tensor<fp16, [1, 10240, 1, 77]> x_21_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_1472, groups = var_1363, pad = x_21_pad_0, pad_type = x_21_pad_type_0, strides = var_1470, weight = block_9_layer_1_DenseReluDense_wi_0_weight_to_fp16, x = input_57_cast_fp16)[name = tensor<string, []>("x_21_cast_fp16")];
            tensor<string, []> var_1486_mode_0 = const()[name = tensor<string, []>("op_1486_mode_0"), val = tensor<string, []>("TANH_APPROXIMATION")];
            tensor<fp16, [1, 10240, 1, 77]> var_1486_cast_fp16 = gelu(mode = var_1486_mode_0, x = x_21_cast_fp16)[name = tensor<string, []>("op_1486_cast_fp16")];
            tensor<int32, [2]> var_1489 = const()[name = tensor<string, []>("op_1489"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1491 = const()[name = tensor<string, []>("op_1491"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_1493_pad_type_0 = const()[name = tensor<string, []>("op_1493_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_1493_pad_0 = const()[name = tensor<string, []>("op_1493_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_9_layer_1_DenseReluDense_wi_1_weight_to_fp16 = const()[name = tensor<string, []>("block_9_layer_1_DenseReluDense_wi_1_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(3955137472)))];
            tensor<fp16, [1, 10240, 1, 77]> var_1493_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_1491, groups = var_1363, pad = var_1493_pad_0, pad_type = var_1493_pad_type_0, strides = var_1489, weight = block_9_layer_1_DenseReluDense_wi_1_weight_to_fp16, x = input_57_cast_fp16)[name = tensor<string, []>("op_1493_cast_fp16")];
            tensor<fp16, [1, 10240, 1, 77]> input_59_cast_fp16 = mul(x = var_1486_cast_fp16, y = var_1493_cast_fp16)[name = tensor<string, []>("input_59_cast_fp16")];
            tensor<int32, [2]> var_1497 = const()[name = tensor<string, []>("op_1497"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1499 = const()[name = tensor<string, []>("op_1499"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_1501_pad_type_0 = const()[name = tensor<string, []>("op_1501_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_1501_pad_0 = const()[name = tensor<string, []>("op_1501_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 10240, 1, 1]> block_9_layer_1_DenseReluDense_wo_weight_to_fp16 = const()[name = tensor<string, []>("block_9_layer_1_DenseReluDense_wo_weight_to_fp16"), val = tensor<fp16, [4096, 10240, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(4039023616)))];
            tensor<fp16, [1, 4096, 1, 77]> var_1501_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_1499, groups = var_1363, pad = var_1501_pad_0, pad_type = var_1501_pad_type_0, strides = var_1497, weight = block_9_layer_1_DenseReluDense_wo_weight_to_fp16, x = input_59_cast_fp16)[name = tensor<string, []>("op_1501_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_81_cast_fp16 = add(x = inputs_79_cast_fp16, y = var_1501_cast_fp16)[name = tensor<string, []>("inputs_81_cast_fp16")];
            tensor<bool, []> var_1506 = const()[name = tensor<string, []>("op_1506"), val = tensor<bool, []>(true)];
            tensor<int32, []> var_1507 = const()[name = tensor<string, []>("op_1507"), val = tensor<int32, []>(1)];
            tensor<int32, []> var_1511 = const()[name = tensor<string, []>("op_1511"), val = tensor<int32, []>(3)];
            tensor<fp16, []> var_1509_to_fp16 = const()[name = tensor<string, []>("op_1509_to_fp16"), val = tensor<fp16, []>(-0x1.b18p+15)];
            tensor<fp16, []> var_1508_to_fp16 = const()[name = tensor<string, []>("op_1508_to_fp16"), val = tensor<fp16, []>(0x1.b18p+15)];
            tensor<fp16, [1, 4096, 1, 77]> inputs_83_cast_fp16 = clip(alpha = var_1509_to_fp16, beta = var_1508_to_fp16, x = inputs_81_cast_fp16)[name = tensor<string, []>("inputs_83_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_41_cast_fp16 = mul(x = inputs_83_cast_fp16, y = inputs_83_cast_fp16)[name = tensor<string, []>("inputs_sq_41_cast_fp16")];
            tensor<int32, [1]> var_1528 = const()[name = tensor<string, []>("op_1528"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_41_cast_fp16 = reduce_mean(axes = var_1528, keep_dims = var_1506, x = inputs_sq_41_cast_fp16)[name = tensor<string, []>("variance_41_cast_fp16")];
            tensor<fp16, []> var_1530_to_fp16 = const()[name = tensor<string, []>("op_1530_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_1531_cast_fp16 = add(x = variance_41_cast_fp16, y = var_1530_to_fp16)[name = tensor<string, []>("op_1531_cast_fp16")];
            tensor<fp16, []> var_1532_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_1532_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_1532_cast_fp16 = rsqrt(epsilon = var_1532_epsilon_0_to_fp16, x = var_1531_cast_fp16)[name = tensor<string, []>("op_1532_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_41_cast_fp16 = mul(x = inputs_83_cast_fp16, y = var_1532_cast_fp16)[name = tensor<string, []>("hidden_states_41_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_41_to_fp16 = const()[name = tensor<string, []>("w_41_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(4122909760)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_43_cast_fp16 = mul(x = w_41_to_fp16, y = hidden_states_41_cast_fp16)[name = tensor<string, []>("obj_43_cast_fp16")];
            tensor<int32, [2]> var_1546 = const()[name = tensor<string, []>("op_1546"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1548 = const()[name = tensor<string, []>("op_1548"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> query_21_pad_type_0 = const()[name = tensor<string, []>("query_21_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> query_21_pad_0 = const()[name = tensor<string, []>("query_21_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_10_layer_0_SelfAttention_q_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_10_layer_0_SelfAttention_q_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(4122918016)))];
            tensor<fp16, [1, 4096, 1, 77]> query_21_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_1548, groups = var_1507, pad = query_21_pad_0, pad_type = query_21_pad_type_0, strides = var_1546, weight = block_10_layer_0_SelfAttention_q_proj_weight_to_fp16, x = obj_43_cast_fp16)[name = tensor<string, []>("query_21_cast_fp16")];
            tensor<int32, [2]> var_1552 = const()[name = tensor<string, []>("op_1552"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1554 = const()[name = tensor<string, []>("op_1554"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> key_21_pad_type_0 = const()[name = tensor<string, []>("key_21_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> key_21_pad_0 = const()[name = tensor<string, []>("key_21_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_10_layer_0_SelfAttention_k_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_10_layer_0_SelfAttention_k_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(4156472512)))];
            tensor<fp16, [1, 4096, 1, 77]> key_21_cast_fp16 = conv(dilations = var_1554, groups = var_1507, pad = key_21_pad_0, pad_type = key_21_pad_type_0, strides = var_1552, weight = block_10_layer_0_SelfAttention_k_proj_weight_to_fp16, x = obj_43_cast_fp16)[name = tensor<string, []>("key_21_cast_fp16")];
            tensor<int32, [2]> var_1559 = const()[name = tensor<string, []>("op_1559"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1561 = const()[name = tensor<string, []>("op_1561"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> value_21_pad_type_0 = const()[name = tensor<string, []>("value_21_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> value_21_pad_0 = const()[name = tensor<string, []>("value_21_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_10_layer_0_SelfAttention_v_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_10_layer_0_SelfAttention_v_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(4190027008)))];
            tensor<fp16, [1, 4096, 1, 77]> value_21_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_1561, groups = var_1507, pad = value_21_pad_0, pad_type = value_21_pad_type_0, strides = var_1559, weight = block_10_layer_0_SelfAttention_v_proj_weight_to_fp16, x = obj_43_cast_fp16)[name = tensor<string, []>("value_21_cast_fp16")];
            tensor<int32, [4]> var_1565 = const()[name = tensor<string, []>("op_1565"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_1566_cast_fp16 = reshape(shape = var_1565, x = query_21_cast_fp16)[name = tensor<string, []>("op_1566_cast_fp16")];
            tensor<int32, [4]> var_1567 = const()[name = tensor<string, []>("op_1567"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_1568_cast_fp16 = reshape(shape = var_1567, x = key_21_cast_fp16)[name = tensor<string, []>("op_1568_cast_fp16")];
            tensor<bool, []> mh_w_61_transpose_x_0 = const()[name = tensor<string, []>("mh_w_61_transpose_x_0"), val = tensor<bool, []>(true)];
            tensor<bool, []> mh_w_61_transpose_y_0 = const()[name = tensor<string, []>("mh_w_61_transpose_y_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 77, 77]> mh_w_61_cast_fp16 = matmul(transpose_x = mh_w_61_transpose_x_0, transpose_y = mh_w_61_transpose_y_0, x = var_1566_cast_fp16, y = var_1568_cast_fp16)[name = tensor<string, []>("mh_w_61_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> mh_w_63_cast_fp16 = add(x = mh_w_61_cast_fp16, y = var_133_cast_fp16)[name = tensor<string, []>("mh_w_63_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> mh_w_65_cast_fp16 = add(x = mh_w_63_cast_fp16, y = relative_attention_bias_to_fp16)[name = tensor<string, []>("mh_w_65_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> var_1577_cast_fp16 = softmax(axis = var_1511, x = mh_w_65_cast_fp16)[name = tensor<string, []>("op_1577_cast_fp16")];
            tensor<int32, [4]> var_1578 = const()[name = tensor<string, []>("op_1578"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_1579_cast_fp16 = reshape(shape = var_1578, x = value_21_cast_fp16)[name = tensor<string, []>("op_1579_cast_fp16")];
            tensor<bool, []> attn_21_transpose_x_0 = const()[name = tensor<string, []>("attn_21_transpose_x_0"), val = tensor<bool, []>(false)];
            tensor<bool, []> attn_21_transpose_y_0 = const()[name = tensor<string, []>("attn_21_transpose_y_0"), val = tensor<bool, []>(true)];
            tensor<fp16, [1, 64, 64, 77]> attn_21_cast_fp16 = matmul(transpose_x = attn_21_transpose_x_0, transpose_y = attn_21_transpose_y_0, x = var_1579_cast_fp16, y = var_1577_cast_fp16)[name = tensor<string, []>("attn_21_cast_fp16")];
            tensor<int32, [4]> var_1582 = const()[name = tensor<string, []>("op_1582"), val = tensor<int32, [4]>([1, 4096, 1, -1])];
            tensor<fp16, [1, 4096, 1, 77]> input_61_cast_fp16 = reshape(shape = var_1582, x = attn_21_cast_fp16)[name = tensor<string, []>("input_61_cast_fp16")];
            tensor<int32, [2]> var_1586 = const()[name = tensor<string, []>("op_1586"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1588 = const()[name = tensor<string, []>("op_1588"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> obj_45_pad_type_0 = const()[name = tensor<string, []>("obj_45_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> obj_45_pad_0 = const()[name = tensor<string, []>("obj_45_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_10_layer_0_SelfAttention_o_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_10_layer_0_SelfAttention_o_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(4223581504)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_45_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_1588, groups = var_1507, pad = obj_45_pad_0, pad_type = obj_45_pad_type_0, strides = var_1586, weight = block_10_layer_0_SelfAttention_o_proj_weight_to_fp16, x = input_61_cast_fp16)[name = tensor<string, []>("obj_45_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_85_cast_fp16 = add(x = inputs_83_cast_fp16, y = obj_45_cast_fp16)[name = tensor<string, []>("inputs_85_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_87_cast_fp16 = clip(alpha = var_1509_to_fp16, beta = var_1508_to_fp16, x = inputs_85_cast_fp16)[name = tensor<string, []>("inputs_87_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_43_cast_fp16 = mul(x = inputs_87_cast_fp16, y = inputs_87_cast_fp16)[name = tensor<string, []>("inputs_sq_43_cast_fp16")];
            tensor<int32, [1]> var_1597 = const()[name = tensor<string, []>("op_1597"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_43_cast_fp16 = reduce_mean(axes = var_1597, keep_dims = var_1506, x = inputs_sq_43_cast_fp16)[name = tensor<string, []>("variance_43_cast_fp16")];
            tensor<fp16, []> var_1599_to_fp16 = const()[name = tensor<string, []>("op_1599_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_1600_cast_fp16 = add(x = variance_43_cast_fp16, y = var_1599_to_fp16)[name = tensor<string, []>("op_1600_cast_fp16")];
            tensor<fp16, []> var_1601_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_1601_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_1601_cast_fp16 = rsqrt(epsilon = var_1601_epsilon_0_to_fp16, x = var_1600_cast_fp16)[name = tensor<string, []>("op_1601_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_43_cast_fp16 = mul(x = inputs_87_cast_fp16, y = var_1601_cast_fp16)[name = tensor<string, []>("hidden_states_43_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_43_to_fp16 = const()[name = tensor<string, []>("w_43_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(4257136000)))];
            tensor<fp16, [1, 4096, 1, 77]> input_63_cast_fp16 = mul(x = w_43_to_fp16, y = hidden_states_43_cast_fp16)[name = tensor<string, []>("input_63_cast_fp16")];
            tensor<int32, [2]> var_1614 = const()[name = tensor<string, []>("op_1614"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1616 = const()[name = tensor<string, []>("op_1616"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> x_23_pad_type_0 = const()[name = tensor<string, []>("x_23_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> x_23_pad_0 = const()[name = tensor<string, []>("x_23_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_10_layer_1_DenseReluDense_wi_0_weight_to_fp16 = const()[name = tensor<string, []>("block_10_layer_1_DenseReluDense_wi_0_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(4257144256)))];
            tensor<fp16, [1, 10240, 1, 77]> x_23_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_1616, groups = var_1507, pad = x_23_pad_0, pad_type = x_23_pad_type_0, strides = var_1614, weight = block_10_layer_1_DenseReluDense_wi_0_weight_to_fp16, x = input_63_cast_fp16)[name = tensor<string, []>("x_23_cast_fp16")];
            tensor<string, []> var_1630_mode_0 = const()[name = tensor<string, []>("op_1630_mode_0"), val = tensor<string, []>("TANH_APPROXIMATION")];
            tensor<fp16, [1, 10240, 1, 77]> var_1630_cast_fp16 = gelu(mode = var_1630_mode_0, x = x_23_cast_fp16)[name = tensor<string, []>("op_1630_cast_fp16")];
            tensor<int32, [2]> var_1633 = const()[name = tensor<string, []>("op_1633"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1635 = const()[name = tensor<string, []>("op_1635"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_1637_pad_type_0 = const()[name = tensor<string, []>("op_1637_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_1637_pad_0 = const()[name = tensor<string, []>("op_1637_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_10_layer_1_DenseReluDense_wi_1_weight_to_fp16 = const()[name = tensor<string, []>("block_10_layer_1_DenseReluDense_wi_1_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(4341030400)))];
            tensor<fp16, [1, 10240, 1, 77]> var_1637_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_1635, groups = var_1507, pad = var_1637_pad_0, pad_type = var_1637_pad_type_0, strides = var_1633, weight = block_10_layer_1_DenseReluDense_wi_1_weight_to_fp16, x = input_63_cast_fp16)[name = tensor<string, []>("op_1637_cast_fp16")];
            tensor<fp16, [1, 10240, 1, 77]> input_65_cast_fp16 = mul(x = var_1630_cast_fp16, y = var_1637_cast_fp16)[name = tensor<string, []>("input_65_cast_fp16")];
            tensor<int32, [2]> var_1641 = const()[name = tensor<string, []>("op_1641"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1643 = const()[name = tensor<string, []>("op_1643"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_1645_pad_type_0 = const()[name = tensor<string, []>("op_1645_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_1645_pad_0 = const()[name = tensor<string, []>("op_1645_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 10240, 1, 1]> block_10_layer_1_DenseReluDense_wo_weight_to_fp16 = const()[name = tensor<string, []>("block_10_layer_1_DenseReluDense_wo_weight_to_fp16"), val = tensor<fp16, [4096, 10240, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(4424916544)))];
            tensor<fp16, [1, 4096, 1, 77]> var_1645_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_1643, groups = var_1507, pad = var_1645_pad_0, pad_type = var_1645_pad_type_0, strides = var_1641, weight = block_10_layer_1_DenseReluDense_wo_weight_to_fp16, x = input_65_cast_fp16)[name = tensor<string, []>("op_1645_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_89_cast_fp16 = add(x = inputs_87_cast_fp16, y = var_1645_cast_fp16)[name = tensor<string, []>("inputs_89_cast_fp16")];
            tensor<bool, []> var_1650 = const()[name = tensor<string, []>("op_1650"), val = tensor<bool, []>(true)];
            tensor<int32, []> var_1651 = const()[name = tensor<string, []>("op_1651"), val = tensor<int32, []>(1)];
            tensor<int32, []> var_1655 = const()[name = tensor<string, []>("op_1655"), val = tensor<int32, []>(3)];
            tensor<fp16, []> var_1653_to_fp16 = const()[name = tensor<string, []>("op_1653_to_fp16"), val = tensor<fp16, []>(-0x1.b18p+15)];
            tensor<fp16, []> var_1652_to_fp16 = const()[name = tensor<string, []>("op_1652_to_fp16"), val = tensor<fp16, []>(0x1.b18p+15)];
            tensor<fp16, [1, 4096, 1, 77]> inputs_91_cast_fp16 = clip(alpha = var_1653_to_fp16, beta = var_1652_to_fp16, x = inputs_89_cast_fp16)[name = tensor<string, []>("inputs_91_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_45_cast_fp16 = mul(x = inputs_91_cast_fp16, y = inputs_91_cast_fp16)[name = tensor<string, []>("inputs_sq_45_cast_fp16")];
            tensor<int32, [1]> var_1672 = const()[name = tensor<string, []>("op_1672"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_45_cast_fp16 = reduce_mean(axes = var_1672, keep_dims = var_1650, x = inputs_sq_45_cast_fp16)[name = tensor<string, []>("variance_45_cast_fp16")];
            tensor<fp16, []> var_1674_to_fp16 = const()[name = tensor<string, []>("op_1674_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_1675_cast_fp16 = add(x = variance_45_cast_fp16, y = var_1674_to_fp16)[name = tensor<string, []>("op_1675_cast_fp16")];
            tensor<fp16, []> var_1676_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_1676_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_1676_cast_fp16 = rsqrt(epsilon = var_1676_epsilon_0_to_fp16, x = var_1675_cast_fp16)[name = tensor<string, []>("op_1676_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_45_cast_fp16 = mul(x = inputs_91_cast_fp16, y = var_1676_cast_fp16)[name = tensor<string, []>("hidden_states_45_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_45_to_fp16 = const()[name = tensor<string, []>("w_45_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(4508802688)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_47_cast_fp16 = mul(x = w_45_to_fp16, y = hidden_states_45_cast_fp16)[name = tensor<string, []>("obj_47_cast_fp16")];
            tensor<int32, [2]> var_1690 = const()[name = tensor<string, []>("op_1690"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1692 = const()[name = tensor<string, []>("op_1692"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> query_23_pad_type_0 = const()[name = tensor<string, []>("query_23_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> query_23_pad_0 = const()[name = tensor<string, []>("query_23_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_11_layer_0_SelfAttention_q_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_11_layer_0_SelfAttention_q_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(4508810944)))];
            tensor<fp16, [1, 4096, 1, 77]> query_23_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_1692, groups = var_1651, pad = query_23_pad_0, pad_type = query_23_pad_type_0, strides = var_1690, weight = block_11_layer_0_SelfAttention_q_proj_weight_to_fp16, x = obj_47_cast_fp16)[name = tensor<string, []>("query_23_cast_fp16")];
            tensor<int32, [2]> var_1696 = const()[name = tensor<string, []>("op_1696"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1698 = const()[name = tensor<string, []>("op_1698"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> key_23_pad_type_0 = const()[name = tensor<string, []>("key_23_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> key_23_pad_0 = const()[name = tensor<string, []>("key_23_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_11_layer_0_SelfAttention_k_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_11_layer_0_SelfAttention_k_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(4542365440)))];
            tensor<fp16, [1, 4096, 1, 77]> key_23_cast_fp16 = conv(dilations = var_1698, groups = var_1651, pad = key_23_pad_0, pad_type = key_23_pad_type_0, strides = var_1696, weight = block_11_layer_0_SelfAttention_k_proj_weight_to_fp16, x = obj_47_cast_fp16)[name = tensor<string, []>("key_23_cast_fp16")];
            tensor<int32, [2]> var_1703 = const()[name = tensor<string, []>("op_1703"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1705 = const()[name = tensor<string, []>("op_1705"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> value_23_pad_type_0 = const()[name = tensor<string, []>("value_23_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> value_23_pad_0 = const()[name = tensor<string, []>("value_23_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_11_layer_0_SelfAttention_v_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_11_layer_0_SelfAttention_v_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(4575919936)))];
            tensor<fp16, [1, 4096, 1, 77]> value_23_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_1705, groups = var_1651, pad = value_23_pad_0, pad_type = value_23_pad_type_0, strides = var_1703, weight = block_11_layer_0_SelfAttention_v_proj_weight_to_fp16, x = obj_47_cast_fp16)[name = tensor<string, []>("value_23_cast_fp16")];
            tensor<int32, [4]> var_1709 = const()[name = tensor<string, []>("op_1709"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_1710_cast_fp16 = reshape(shape = var_1709, x = query_23_cast_fp16)[name = tensor<string, []>("op_1710_cast_fp16")];
            tensor<int32, [4]> var_1711 = const()[name = tensor<string, []>("op_1711"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_1712_cast_fp16 = reshape(shape = var_1711, x = key_23_cast_fp16)[name = tensor<string, []>("op_1712_cast_fp16")];
            tensor<bool, []> mh_w_67_transpose_x_0 = const()[name = tensor<string, []>("mh_w_67_transpose_x_0"), val = tensor<bool, []>(true)];
            tensor<bool, []> mh_w_67_transpose_y_0 = const()[name = tensor<string, []>("mh_w_67_transpose_y_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 77, 77]> mh_w_67_cast_fp16 = matmul(transpose_x = mh_w_67_transpose_x_0, transpose_y = mh_w_67_transpose_y_0, x = var_1710_cast_fp16, y = var_1712_cast_fp16)[name = tensor<string, []>("mh_w_67_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> mh_w_69_cast_fp16 = add(x = mh_w_67_cast_fp16, y = var_133_cast_fp16)[name = tensor<string, []>("mh_w_69_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> mh_w_71_cast_fp16 = add(x = mh_w_69_cast_fp16, y = relative_attention_bias_to_fp16)[name = tensor<string, []>("mh_w_71_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> var_1721_cast_fp16 = softmax(axis = var_1655, x = mh_w_71_cast_fp16)[name = tensor<string, []>("op_1721_cast_fp16")];
            tensor<int32, [4]> var_1722 = const()[name = tensor<string, []>("op_1722"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_1723_cast_fp16 = reshape(shape = var_1722, x = value_23_cast_fp16)[name = tensor<string, []>("op_1723_cast_fp16")];
            tensor<bool, []> attn_23_transpose_x_0 = const()[name = tensor<string, []>("attn_23_transpose_x_0"), val = tensor<bool, []>(false)];
            tensor<bool, []> attn_23_transpose_y_0 = const()[name = tensor<string, []>("attn_23_transpose_y_0"), val = tensor<bool, []>(true)];
            tensor<fp16, [1, 64, 64, 77]> attn_23_cast_fp16 = matmul(transpose_x = attn_23_transpose_x_0, transpose_y = attn_23_transpose_y_0, x = var_1723_cast_fp16, y = var_1721_cast_fp16)[name = tensor<string, []>("attn_23_cast_fp16")];
            tensor<int32, [4]> var_1726 = const()[name = tensor<string, []>("op_1726"), val = tensor<int32, [4]>([1, 4096, 1, -1])];
            tensor<fp16, [1, 4096, 1, 77]> input_67_cast_fp16 = reshape(shape = var_1726, x = attn_23_cast_fp16)[name = tensor<string, []>("input_67_cast_fp16")];
            tensor<int32, [2]> var_1730 = const()[name = tensor<string, []>("op_1730"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1732 = const()[name = tensor<string, []>("op_1732"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> obj_49_pad_type_0 = const()[name = tensor<string, []>("obj_49_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> obj_49_pad_0 = const()[name = tensor<string, []>("obj_49_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_11_layer_0_SelfAttention_o_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_11_layer_0_SelfAttention_o_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(4609474432)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_49_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_1732, groups = var_1651, pad = obj_49_pad_0, pad_type = obj_49_pad_type_0, strides = var_1730, weight = block_11_layer_0_SelfAttention_o_proj_weight_to_fp16, x = input_67_cast_fp16)[name = tensor<string, []>("obj_49_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_93_cast_fp16 = add(x = inputs_91_cast_fp16, y = obj_49_cast_fp16)[name = tensor<string, []>("inputs_93_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_95_cast_fp16 = clip(alpha = var_1653_to_fp16, beta = var_1652_to_fp16, x = inputs_93_cast_fp16)[name = tensor<string, []>("inputs_95_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_47_cast_fp16 = mul(x = inputs_95_cast_fp16, y = inputs_95_cast_fp16)[name = tensor<string, []>("inputs_sq_47_cast_fp16")];
            tensor<int32, [1]> var_1741 = const()[name = tensor<string, []>("op_1741"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_47_cast_fp16 = reduce_mean(axes = var_1741, keep_dims = var_1650, x = inputs_sq_47_cast_fp16)[name = tensor<string, []>("variance_47_cast_fp16")];
            tensor<fp16, []> var_1743_to_fp16 = const()[name = tensor<string, []>("op_1743_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_1744_cast_fp16 = add(x = variance_47_cast_fp16, y = var_1743_to_fp16)[name = tensor<string, []>("op_1744_cast_fp16")];
            tensor<fp16, []> var_1745_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_1745_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_1745_cast_fp16 = rsqrt(epsilon = var_1745_epsilon_0_to_fp16, x = var_1744_cast_fp16)[name = tensor<string, []>("op_1745_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_47_cast_fp16 = mul(x = inputs_95_cast_fp16, y = var_1745_cast_fp16)[name = tensor<string, []>("hidden_states_47_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_47_to_fp16 = const()[name = tensor<string, []>("w_47_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(4643028928)))];
            tensor<fp16, [1, 4096, 1, 77]> input_69_cast_fp16 = mul(x = w_47_to_fp16, y = hidden_states_47_cast_fp16)[name = tensor<string, []>("input_69_cast_fp16")];
            tensor<int32, [2]> var_1758 = const()[name = tensor<string, []>("op_1758"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1760 = const()[name = tensor<string, []>("op_1760"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> x_25_pad_type_0 = const()[name = tensor<string, []>("x_25_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> x_25_pad_0 = const()[name = tensor<string, []>("x_25_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_11_layer_1_DenseReluDense_wi_0_weight_to_fp16 = const()[name = tensor<string, []>("block_11_layer_1_DenseReluDense_wi_0_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(4643037184)))];
            tensor<fp16, [1, 10240, 1, 77]> x_25_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_1760, groups = var_1651, pad = x_25_pad_0, pad_type = x_25_pad_type_0, strides = var_1758, weight = block_11_layer_1_DenseReluDense_wi_0_weight_to_fp16, x = input_69_cast_fp16)[name = tensor<string, []>("x_25_cast_fp16")];
            tensor<string, []> var_1774_mode_0 = const()[name = tensor<string, []>("op_1774_mode_0"), val = tensor<string, []>("TANH_APPROXIMATION")];
            tensor<fp16, [1, 10240, 1, 77]> var_1774_cast_fp16 = gelu(mode = var_1774_mode_0, x = x_25_cast_fp16)[name = tensor<string, []>("op_1774_cast_fp16")];
            tensor<int32, [2]> var_1777 = const()[name = tensor<string, []>("op_1777"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1779 = const()[name = tensor<string, []>("op_1779"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_1781_pad_type_0 = const()[name = tensor<string, []>("op_1781_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_1781_pad_0 = const()[name = tensor<string, []>("op_1781_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_11_layer_1_DenseReluDense_wi_1_weight_to_fp16 = const()[name = tensor<string, []>("block_11_layer_1_DenseReluDense_wi_1_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(4726923328)))];
            tensor<fp16, [1, 10240, 1, 77]> var_1781_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_1779, groups = var_1651, pad = var_1781_pad_0, pad_type = var_1781_pad_type_0, strides = var_1777, weight = block_11_layer_1_DenseReluDense_wi_1_weight_to_fp16, x = input_69_cast_fp16)[name = tensor<string, []>("op_1781_cast_fp16")];
            tensor<fp16, [1, 10240, 1, 77]> input_71_cast_fp16 = mul(x = var_1774_cast_fp16, y = var_1781_cast_fp16)[name = tensor<string, []>("input_71_cast_fp16")];
            tensor<int32, [2]> var_1785 = const()[name = tensor<string, []>("op_1785"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1787 = const()[name = tensor<string, []>("op_1787"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_1789_pad_type_0 = const()[name = tensor<string, []>("op_1789_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_1789_pad_0 = const()[name = tensor<string, []>("op_1789_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 10240, 1, 1]> block_11_layer_1_DenseReluDense_wo_weight_to_fp16 = const()[name = tensor<string, []>("block_11_layer_1_DenseReluDense_wo_weight_to_fp16"), val = tensor<fp16, [4096, 10240, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(4810809472)))];
            tensor<fp16, [1, 4096, 1, 77]> var_1789_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_1787, groups = var_1651, pad = var_1789_pad_0, pad_type = var_1789_pad_type_0, strides = var_1785, weight = block_11_layer_1_DenseReluDense_wo_weight_to_fp16, x = input_71_cast_fp16)[name = tensor<string, []>("op_1789_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_97_cast_fp16 = add(x = inputs_95_cast_fp16, y = var_1789_cast_fp16)[name = tensor<string, []>("inputs_97_cast_fp16")];
            tensor<bool, []> var_1794 = const()[name = tensor<string, []>("op_1794"), val = tensor<bool, []>(true)];
            tensor<int32, []> var_1795 = const()[name = tensor<string, []>("op_1795"), val = tensor<int32, []>(1)];
            tensor<int32, []> var_1799 = const()[name = tensor<string, []>("op_1799"), val = tensor<int32, []>(3)];
            tensor<fp16, []> var_1797_to_fp16 = const()[name = tensor<string, []>("op_1797_to_fp16"), val = tensor<fp16, []>(-0x1.b18p+15)];
            tensor<fp16, []> var_1796_to_fp16 = const()[name = tensor<string, []>("op_1796_to_fp16"), val = tensor<fp16, []>(0x1.b18p+15)];
            tensor<fp16, [1, 4096, 1, 77]> inputs_99_cast_fp16 = clip(alpha = var_1797_to_fp16, beta = var_1796_to_fp16, x = inputs_97_cast_fp16)[name = tensor<string, []>("inputs_99_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_49_cast_fp16 = mul(x = inputs_99_cast_fp16, y = inputs_99_cast_fp16)[name = tensor<string, []>("inputs_sq_49_cast_fp16")];
            tensor<int32, [1]> var_1816 = const()[name = tensor<string, []>("op_1816"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_49_cast_fp16 = reduce_mean(axes = var_1816, keep_dims = var_1794, x = inputs_sq_49_cast_fp16)[name = tensor<string, []>("variance_49_cast_fp16")];
            tensor<fp16, []> var_1818_to_fp16 = const()[name = tensor<string, []>("op_1818_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_1819_cast_fp16 = add(x = variance_49_cast_fp16, y = var_1818_to_fp16)[name = tensor<string, []>("op_1819_cast_fp16")];
            tensor<fp16, []> var_1820_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_1820_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_1820_cast_fp16 = rsqrt(epsilon = var_1820_epsilon_0_to_fp16, x = var_1819_cast_fp16)[name = tensor<string, []>("op_1820_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_49_cast_fp16 = mul(x = inputs_99_cast_fp16, y = var_1820_cast_fp16)[name = tensor<string, []>("hidden_states_49_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_49_to_fp16 = const()[name = tensor<string, []>("w_49_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(4894695616)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_51_cast_fp16 = mul(x = w_49_to_fp16, y = hidden_states_49_cast_fp16)[name = tensor<string, []>("obj_51_cast_fp16")];
            tensor<int32, [2]> var_1834 = const()[name = tensor<string, []>("op_1834"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1836 = const()[name = tensor<string, []>("op_1836"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> query_25_pad_type_0 = const()[name = tensor<string, []>("query_25_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> query_25_pad_0 = const()[name = tensor<string, []>("query_25_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_12_layer_0_SelfAttention_q_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_12_layer_0_SelfAttention_q_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(4894703872)))];
            tensor<fp16, [1, 4096, 1, 77]> query_25_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_1836, groups = var_1795, pad = query_25_pad_0, pad_type = query_25_pad_type_0, strides = var_1834, weight = block_12_layer_0_SelfAttention_q_proj_weight_to_fp16, x = obj_51_cast_fp16)[name = tensor<string, []>("query_25_cast_fp16")];
            tensor<int32, [2]> var_1840 = const()[name = tensor<string, []>("op_1840"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1842 = const()[name = tensor<string, []>("op_1842"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> key_25_pad_type_0 = const()[name = tensor<string, []>("key_25_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> key_25_pad_0 = const()[name = tensor<string, []>("key_25_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_12_layer_0_SelfAttention_k_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_12_layer_0_SelfAttention_k_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(4928258368)))];
            tensor<fp16, [1, 4096, 1, 77]> key_25_cast_fp16 = conv(dilations = var_1842, groups = var_1795, pad = key_25_pad_0, pad_type = key_25_pad_type_0, strides = var_1840, weight = block_12_layer_0_SelfAttention_k_proj_weight_to_fp16, x = obj_51_cast_fp16)[name = tensor<string, []>("key_25_cast_fp16")];
            tensor<int32, [2]> var_1847 = const()[name = tensor<string, []>("op_1847"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1849 = const()[name = tensor<string, []>("op_1849"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> value_25_pad_type_0 = const()[name = tensor<string, []>("value_25_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> value_25_pad_0 = const()[name = tensor<string, []>("value_25_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_12_layer_0_SelfAttention_v_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_12_layer_0_SelfAttention_v_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(4961812864)))];
            tensor<fp16, [1, 4096, 1, 77]> value_25_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_1849, groups = var_1795, pad = value_25_pad_0, pad_type = value_25_pad_type_0, strides = var_1847, weight = block_12_layer_0_SelfAttention_v_proj_weight_to_fp16, x = obj_51_cast_fp16)[name = tensor<string, []>("value_25_cast_fp16")];
            tensor<int32, [4]> var_1853 = const()[name = tensor<string, []>("op_1853"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_1854_cast_fp16 = reshape(shape = var_1853, x = query_25_cast_fp16)[name = tensor<string, []>("op_1854_cast_fp16")];
            tensor<int32, [4]> var_1855 = const()[name = tensor<string, []>("op_1855"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_1856_cast_fp16 = reshape(shape = var_1855, x = key_25_cast_fp16)[name = tensor<string, []>("op_1856_cast_fp16")];
            tensor<bool, []> mh_w_73_transpose_x_0 = const()[name = tensor<string, []>("mh_w_73_transpose_x_0"), val = tensor<bool, []>(true)];
            tensor<bool, []> mh_w_73_transpose_y_0 = const()[name = tensor<string, []>("mh_w_73_transpose_y_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 77, 77]> mh_w_73_cast_fp16 = matmul(transpose_x = mh_w_73_transpose_x_0, transpose_y = mh_w_73_transpose_y_0, x = var_1854_cast_fp16, y = var_1856_cast_fp16)[name = tensor<string, []>("mh_w_73_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> mh_w_75_cast_fp16 = add(x = mh_w_73_cast_fp16, y = var_133_cast_fp16)[name = tensor<string, []>("mh_w_75_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> mh_w_77_cast_fp16 = add(x = mh_w_75_cast_fp16, y = relative_attention_bias_to_fp16)[name = tensor<string, []>("mh_w_77_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> var_1865_cast_fp16 = softmax(axis = var_1799, x = mh_w_77_cast_fp16)[name = tensor<string, []>("op_1865_cast_fp16")];
            tensor<int32, [4]> var_1866 = const()[name = tensor<string, []>("op_1866"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_1867_cast_fp16 = reshape(shape = var_1866, x = value_25_cast_fp16)[name = tensor<string, []>("op_1867_cast_fp16")];
            tensor<bool, []> attn_25_transpose_x_0 = const()[name = tensor<string, []>("attn_25_transpose_x_0"), val = tensor<bool, []>(false)];
            tensor<bool, []> attn_25_transpose_y_0 = const()[name = tensor<string, []>("attn_25_transpose_y_0"), val = tensor<bool, []>(true)];
            tensor<fp16, [1, 64, 64, 77]> attn_25_cast_fp16 = matmul(transpose_x = attn_25_transpose_x_0, transpose_y = attn_25_transpose_y_0, x = var_1867_cast_fp16, y = var_1865_cast_fp16)[name = tensor<string, []>("attn_25_cast_fp16")];
            tensor<int32, [4]> var_1870 = const()[name = tensor<string, []>("op_1870"), val = tensor<int32, [4]>([1, 4096, 1, -1])];
            tensor<fp16, [1, 4096, 1, 77]> input_73_cast_fp16 = reshape(shape = var_1870, x = attn_25_cast_fp16)[name = tensor<string, []>("input_73_cast_fp16")];
            tensor<int32, [2]> var_1874 = const()[name = tensor<string, []>("op_1874"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1876 = const()[name = tensor<string, []>("op_1876"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> obj_53_pad_type_0 = const()[name = tensor<string, []>("obj_53_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> obj_53_pad_0 = const()[name = tensor<string, []>("obj_53_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_12_layer_0_SelfAttention_o_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_12_layer_0_SelfAttention_o_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(4995367360)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_53_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_1876, groups = var_1795, pad = obj_53_pad_0, pad_type = obj_53_pad_type_0, strides = var_1874, weight = block_12_layer_0_SelfAttention_o_proj_weight_to_fp16, x = input_73_cast_fp16)[name = tensor<string, []>("obj_53_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_101_cast_fp16 = add(x = inputs_99_cast_fp16, y = obj_53_cast_fp16)[name = tensor<string, []>("inputs_101_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_103_cast_fp16 = clip(alpha = var_1797_to_fp16, beta = var_1796_to_fp16, x = inputs_101_cast_fp16)[name = tensor<string, []>("inputs_103_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_51_cast_fp16 = mul(x = inputs_103_cast_fp16, y = inputs_103_cast_fp16)[name = tensor<string, []>("inputs_sq_51_cast_fp16")];
            tensor<int32, [1]> var_1885 = const()[name = tensor<string, []>("op_1885"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_51_cast_fp16 = reduce_mean(axes = var_1885, keep_dims = var_1794, x = inputs_sq_51_cast_fp16)[name = tensor<string, []>("variance_51_cast_fp16")];
            tensor<fp16, []> var_1887_to_fp16 = const()[name = tensor<string, []>("op_1887_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_1888_cast_fp16 = add(x = variance_51_cast_fp16, y = var_1887_to_fp16)[name = tensor<string, []>("op_1888_cast_fp16")];
            tensor<fp16, []> var_1889_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_1889_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_1889_cast_fp16 = rsqrt(epsilon = var_1889_epsilon_0_to_fp16, x = var_1888_cast_fp16)[name = tensor<string, []>("op_1889_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_51_cast_fp16 = mul(x = inputs_103_cast_fp16, y = var_1889_cast_fp16)[name = tensor<string, []>("hidden_states_51_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_51_to_fp16 = const()[name = tensor<string, []>("w_51_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(5028921856)))];
            tensor<fp16, [1, 4096, 1, 77]> input_75_cast_fp16 = mul(x = w_51_to_fp16, y = hidden_states_51_cast_fp16)[name = tensor<string, []>("input_75_cast_fp16")];
            tensor<int32, [2]> var_1902 = const()[name = tensor<string, []>("op_1902"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1904 = const()[name = tensor<string, []>("op_1904"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> x_27_pad_type_0 = const()[name = tensor<string, []>("x_27_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> x_27_pad_0 = const()[name = tensor<string, []>("x_27_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_12_layer_1_DenseReluDense_wi_0_weight_to_fp16 = const()[name = tensor<string, []>("block_12_layer_1_DenseReluDense_wi_0_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(5028930112)))];
            tensor<fp16, [1, 10240, 1, 77]> x_27_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_1904, groups = var_1795, pad = x_27_pad_0, pad_type = x_27_pad_type_0, strides = var_1902, weight = block_12_layer_1_DenseReluDense_wi_0_weight_to_fp16, x = input_75_cast_fp16)[name = tensor<string, []>("x_27_cast_fp16")];
            tensor<string, []> var_1918_mode_0 = const()[name = tensor<string, []>("op_1918_mode_0"), val = tensor<string, []>("TANH_APPROXIMATION")];
            tensor<fp16, [1, 10240, 1, 77]> var_1918_cast_fp16 = gelu(mode = var_1918_mode_0, x = x_27_cast_fp16)[name = tensor<string, []>("op_1918_cast_fp16")];
            tensor<int32, [2]> var_1921 = const()[name = tensor<string, []>("op_1921"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1923 = const()[name = tensor<string, []>("op_1923"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_1925_pad_type_0 = const()[name = tensor<string, []>("op_1925_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_1925_pad_0 = const()[name = tensor<string, []>("op_1925_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_12_layer_1_DenseReluDense_wi_1_weight_to_fp16 = const()[name = tensor<string, []>("block_12_layer_1_DenseReluDense_wi_1_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(5112816256)))];
            tensor<fp16, [1, 10240, 1, 77]> var_1925_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_1923, groups = var_1795, pad = var_1925_pad_0, pad_type = var_1925_pad_type_0, strides = var_1921, weight = block_12_layer_1_DenseReluDense_wi_1_weight_to_fp16, x = input_75_cast_fp16)[name = tensor<string, []>("op_1925_cast_fp16")];
            tensor<fp16, [1, 10240, 1, 77]> input_77_cast_fp16 = mul(x = var_1918_cast_fp16, y = var_1925_cast_fp16)[name = tensor<string, []>("input_77_cast_fp16")];
            tensor<int32, [2]> var_1929 = const()[name = tensor<string, []>("op_1929"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1931 = const()[name = tensor<string, []>("op_1931"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_1933_pad_type_0 = const()[name = tensor<string, []>("op_1933_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_1933_pad_0 = const()[name = tensor<string, []>("op_1933_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 10240, 1, 1]> block_12_layer_1_DenseReluDense_wo_weight_to_fp16 = const()[name = tensor<string, []>("block_12_layer_1_DenseReluDense_wo_weight_to_fp16"), val = tensor<fp16, [4096, 10240, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(5196702400)))];
            tensor<fp16, [1, 4096, 1, 77]> var_1933_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_1931, groups = var_1795, pad = var_1933_pad_0, pad_type = var_1933_pad_type_0, strides = var_1929, weight = block_12_layer_1_DenseReluDense_wo_weight_to_fp16, x = input_77_cast_fp16)[name = tensor<string, []>("op_1933_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_105_cast_fp16 = add(x = inputs_103_cast_fp16, y = var_1933_cast_fp16)[name = tensor<string, []>("inputs_105_cast_fp16")];
            tensor<bool, []> var_1938 = const()[name = tensor<string, []>("op_1938"), val = tensor<bool, []>(true)];
            tensor<int32, []> var_1939 = const()[name = tensor<string, []>("op_1939"), val = tensor<int32, []>(1)];
            tensor<int32, []> var_1943 = const()[name = tensor<string, []>("op_1943"), val = tensor<int32, []>(3)];
            tensor<fp16, []> var_1941_to_fp16 = const()[name = tensor<string, []>("op_1941_to_fp16"), val = tensor<fp16, []>(-0x1.b18p+15)];
            tensor<fp16, []> var_1940_to_fp16 = const()[name = tensor<string, []>("op_1940_to_fp16"), val = tensor<fp16, []>(0x1.b18p+15)];
            tensor<fp16, [1, 4096, 1, 77]> inputs_107_cast_fp16 = clip(alpha = var_1941_to_fp16, beta = var_1940_to_fp16, x = inputs_105_cast_fp16)[name = tensor<string, []>("inputs_107_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_53_cast_fp16 = mul(x = inputs_107_cast_fp16, y = inputs_107_cast_fp16)[name = tensor<string, []>("inputs_sq_53_cast_fp16")];
            tensor<int32, [1]> var_1960 = const()[name = tensor<string, []>("op_1960"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_53_cast_fp16 = reduce_mean(axes = var_1960, keep_dims = var_1938, x = inputs_sq_53_cast_fp16)[name = tensor<string, []>("variance_53_cast_fp16")];
            tensor<fp16, []> var_1962_to_fp16 = const()[name = tensor<string, []>("op_1962_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_1963_cast_fp16 = add(x = variance_53_cast_fp16, y = var_1962_to_fp16)[name = tensor<string, []>("op_1963_cast_fp16")];
            tensor<fp16, []> var_1964_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_1964_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_1964_cast_fp16 = rsqrt(epsilon = var_1964_epsilon_0_to_fp16, x = var_1963_cast_fp16)[name = tensor<string, []>("op_1964_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_53_cast_fp16 = mul(x = inputs_107_cast_fp16, y = var_1964_cast_fp16)[name = tensor<string, []>("hidden_states_53_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_53_to_fp16 = const()[name = tensor<string, []>("w_53_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(5280588544)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_55_cast_fp16 = mul(x = w_53_to_fp16, y = hidden_states_53_cast_fp16)[name = tensor<string, []>("obj_55_cast_fp16")];
            tensor<int32, [2]> var_1978 = const()[name = tensor<string, []>("op_1978"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1980 = const()[name = tensor<string, []>("op_1980"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> query_27_pad_type_0 = const()[name = tensor<string, []>("query_27_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> query_27_pad_0 = const()[name = tensor<string, []>("query_27_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_13_layer_0_SelfAttention_q_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_13_layer_0_SelfAttention_q_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(5280596800)))];
            tensor<fp16, [1, 4096, 1, 77]> query_27_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_1980, groups = var_1939, pad = query_27_pad_0, pad_type = query_27_pad_type_0, strides = var_1978, weight = block_13_layer_0_SelfAttention_q_proj_weight_to_fp16, x = obj_55_cast_fp16)[name = tensor<string, []>("query_27_cast_fp16")];
            tensor<int32, [2]> var_1984 = const()[name = tensor<string, []>("op_1984"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1986 = const()[name = tensor<string, []>("op_1986"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> key_27_pad_type_0 = const()[name = tensor<string, []>("key_27_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> key_27_pad_0 = const()[name = tensor<string, []>("key_27_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_13_layer_0_SelfAttention_k_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_13_layer_0_SelfAttention_k_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(5314151296)))];
            tensor<fp16, [1, 4096, 1, 77]> key_27_cast_fp16 = conv(dilations = var_1986, groups = var_1939, pad = key_27_pad_0, pad_type = key_27_pad_type_0, strides = var_1984, weight = block_13_layer_0_SelfAttention_k_proj_weight_to_fp16, x = obj_55_cast_fp16)[name = tensor<string, []>("key_27_cast_fp16")];
            tensor<int32, [2]> var_1991 = const()[name = tensor<string, []>("op_1991"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1993 = const()[name = tensor<string, []>("op_1993"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> value_27_pad_type_0 = const()[name = tensor<string, []>("value_27_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> value_27_pad_0 = const()[name = tensor<string, []>("value_27_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_13_layer_0_SelfAttention_v_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_13_layer_0_SelfAttention_v_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(5347705792)))];
            tensor<fp16, [1, 4096, 1, 77]> value_27_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_1993, groups = var_1939, pad = value_27_pad_0, pad_type = value_27_pad_type_0, strides = var_1991, weight = block_13_layer_0_SelfAttention_v_proj_weight_to_fp16, x = obj_55_cast_fp16)[name = tensor<string, []>("value_27_cast_fp16")];
            tensor<int32, [4]> var_1997 = const()[name = tensor<string, []>("op_1997"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_1998_cast_fp16 = reshape(shape = var_1997, x = query_27_cast_fp16)[name = tensor<string, []>("op_1998_cast_fp16")];
            tensor<int32, [4]> var_1999 = const()[name = tensor<string, []>("op_1999"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_2000_cast_fp16 = reshape(shape = var_1999, x = key_27_cast_fp16)[name = tensor<string, []>("op_2000_cast_fp16")];
            tensor<bool, []> mh_w_79_transpose_x_0 = const()[name = tensor<string, []>("mh_w_79_transpose_x_0"), val = tensor<bool, []>(true)];
            tensor<bool, []> mh_w_79_transpose_y_0 = const()[name = tensor<string, []>("mh_w_79_transpose_y_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 77, 77]> mh_w_79_cast_fp16 = matmul(transpose_x = mh_w_79_transpose_x_0, transpose_y = mh_w_79_transpose_y_0, x = var_1998_cast_fp16, y = var_2000_cast_fp16)[name = tensor<string, []>("mh_w_79_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> mh_w_81_cast_fp16 = add(x = mh_w_79_cast_fp16, y = var_133_cast_fp16)[name = tensor<string, []>("mh_w_81_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> mh_w_83_cast_fp16 = add(x = mh_w_81_cast_fp16, y = relative_attention_bias_to_fp16)[name = tensor<string, []>("mh_w_83_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> var_2009_cast_fp16 = softmax(axis = var_1943, x = mh_w_83_cast_fp16)[name = tensor<string, []>("op_2009_cast_fp16")];
            tensor<int32, [4]> var_2010 = const()[name = tensor<string, []>("op_2010"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_2011_cast_fp16 = reshape(shape = var_2010, x = value_27_cast_fp16)[name = tensor<string, []>("op_2011_cast_fp16")];
            tensor<bool, []> attn_27_transpose_x_0 = const()[name = tensor<string, []>("attn_27_transpose_x_0"), val = tensor<bool, []>(false)];
            tensor<bool, []> attn_27_transpose_y_0 = const()[name = tensor<string, []>("attn_27_transpose_y_0"), val = tensor<bool, []>(true)];
            tensor<fp16, [1, 64, 64, 77]> attn_27_cast_fp16 = matmul(transpose_x = attn_27_transpose_x_0, transpose_y = attn_27_transpose_y_0, x = var_2011_cast_fp16, y = var_2009_cast_fp16)[name = tensor<string, []>("attn_27_cast_fp16")];
            tensor<int32, [4]> var_2014 = const()[name = tensor<string, []>("op_2014"), val = tensor<int32, [4]>([1, 4096, 1, -1])];
            tensor<fp16, [1, 4096, 1, 77]> input_79_cast_fp16 = reshape(shape = var_2014, x = attn_27_cast_fp16)[name = tensor<string, []>("input_79_cast_fp16")];
            tensor<int32, [2]> var_2018 = const()[name = tensor<string, []>("op_2018"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2020 = const()[name = tensor<string, []>("op_2020"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> obj_57_pad_type_0 = const()[name = tensor<string, []>("obj_57_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> obj_57_pad_0 = const()[name = tensor<string, []>("obj_57_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_13_layer_0_SelfAttention_o_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_13_layer_0_SelfAttention_o_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(5381260288)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_57_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_2020, groups = var_1939, pad = obj_57_pad_0, pad_type = obj_57_pad_type_0, strides = var_2018, weight = block_13_layer_0_SelfAttention_o_proj_weight_to_fp16, x = input_79_cast_fp16)[name = tensor<string, []>("obj_57_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_109_cast_fp16 = add(x = inputs_107_cast_fp16, y = obj_57_cast_fp16)[name = tensor<string, []>("inputs_109_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_111_cast_fp16 = clip(alpha = var_1941_to_fp16, beta = var_1940_to_fp16, x = inputs_109_cast_fp16)[name = tensor<string, []>("inputs_111_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_55_cast_fp16 = mul(x = inputs_111_cast_fp16, y = inputs_111_cast_fp16)[name = tensor<string, []>("inputs_sq_55_cast_fp16")];
            tensor<int32, [1]> var_2029 = const()[name = tensor<string, []>("op_2029"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_55_cast_fp16 = reduce_mean(axes = var_2029, keep_dims = var_1938, x = inputs_sq_55_cast_fp16)[name = tensor<string, []>("variance_55_cast_fp16")];
            tensor<fp16, []> var_2031_to_fp16 = const()[name = tensor<string, []>("op_2031_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_2032_cast_fp16 = add(x = variance_55_cast_fp16, y = var_2031_to_fp16)[name = tensor<string, []>("op_2032_cast_fp16")];
            tensor<fp16, []> var_2033_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_2033_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_2033_cast_fp16 = rsqrt(epsilon = var_2033_epsilon_0_to_fp16, x = var_2032_cast_fp16)[name = tensor<string, []>("op_2033_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_55_cast_fp16 = mul(x = inputs_111_cast_fp16, y = var_2033_cast_fp16)[name = tensor<string, []>("hidden_states_55_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_55_to_fp16 = const()[name = tensor<string, []>("w_55_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(5414814784)))];
            tensor<fp16, [1, 4096, 1, 77]> input_81_cast_fp16 = mul(x = w_55_to_fp16, y = hidden_states_55_cast_fp16)[name = tensor<string, []>("input_81_cast_fp16")];
            tensor<int32, [2]> var_2046 = const()[name = tensor<string, []>("op_2046"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2048 = const()[name = tensor<string, []>("op_2048"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> x_29_pad_type_0 = const()[name = tensor<string, []>("x_29_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> x_29_pad_0 = const()[name = tensor<string, []>("x_29_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_13_layer_1_DenseReluDense_wi_0_weight_to_fp16 = const()[name = tensor<string, []>("block_13_layer_1_DenseReluDense_wi_0_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(5414823040)))];
            tensor<fp16, [1, 10240, 1, 77]> x_29_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_2048, groups = var_1939, pad = x_29_pad_0, pad_type = x_29_pad_type_0, strides = var_2046, weight = block_13_layer_1_DenseReluDense_wi_0_weight_to_fp16, x = input_81_cast_fp16)[name = tensor<string, []>("x_29_cast_fp16")];
            tensor<string, []> var_2062_mode_0 = const()[name = tensor<string, []>("op_2062_mode_0"), val = tensor<string, []>("TANH_APPROXIMATION")];
            tensor<fp16, [1, 10240, 1, 77]> var_2062_cast_fp16 = gelu(mode = var_2062_mode_0, x = x_29_cast_fp16)[name = tensor<string, []>("op_2062_cast_fp16")];
            tensor<int32, [2]> var_2065 = const()[name = tensor<string, []>("op_2065"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2067 = const()[name = tensor<string, []>("op_2067"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_2069_pad_type_0 = const()[name = tensor<string, []>("op_2069_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_2069_pad_0 = const()[name = tensor<string, []>("op_2069_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_13_layer_1_DenseReluDense_wi_1_weight_to_fp16 = const()[name = tensor<string, []>("block_13_layer_1_DenseReluDense_wi_1_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(5498709184)))];
            tensor<fp16, [1, 10240, 1, 77]> var_2069_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_2067, groups = var_1939, pad = var_2069_pad_0, pad_type = var_2069_pad_type_0, strides = var_2065, weight = block_13_layer_1_DenseReluDense_wi_1_weight_to_fp16, x = input_81_cast_fp16)[name = tensor<string, []>("op_2069_cast_fp16")];
            tensor<fp16, [1, 10240, 1, 77]> input_83_cast_fp16 = mul(x = var_2062_cast_fp16, y = var_2069_cast_fp16)[name = tensor<string, []>("input_83_cast_fp16")];
            tensor<int32, [2]> var_2073 = const()[name = tensor<string, []>("op_2073"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2075 = const()[name = tensor<string, []>("op_2075"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_2077_pad_type_0 = const()[name = tensor<string, []>("op_2077_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_2077_pad_0 = const()[name = tensor<string, []>("op_2077_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 10240, 1, 1]> block_13_layer_1_DenseReluDense_wo_weight_to_fp16 = const()[name = tensor<string, []>("block_13_layer_1_DenseReluDense_wo_weight_to_fp16"), val = tensor<fp16, [4096, 10240, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(5582595328)))];
            tensor<fp16, [1, 4096, 1, 77]> var_2077_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_2075, groups = var_1939, pad = var_2077_pad_0, pad_type = var_2077_pad_type_0, strides = var_2073, weight = block_13_layer_1_DenseReluDense_wo_weight_to_fp16, x = input_83_cast_fp16)[name = tensor<string, []>("op_2077_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_113_cast_fp16 = add(x = inputs_111_cast_fp16, y = var_2077_cast_fp16)[name = tensor<string, []>("inputs_113_cast_fp16")];
            tensor<bool, []> var_2082 = const()[name = tensor<string, []>("op_2082"), val = tensor<bool, []>(true)];
            tensor<int32, []> var_2083 = const()[name = tensor<string, []>("op_2083"), val = tensor<int32, []>(1)];
            tensor<int32, []> var_2087 = const()[name = tensor<string, []>("op_2087"), val = tensor<int32, []>(3)];
            tensor<fp16, []> var_2085_to_fp16 = const()[name = tensor<string, []>("op_2085_to_fp16"), val = tensor<fp16, []>(-0x1.b18p+15)];
            tensor<fp16, []> var_2084_to_fp16 = const()[name = tensor<string, []>("op_2084_to_fp16"), val = tensor<fp16, []>(0x1.b18p+15)];
            tensor<fp16, [1, 4096, 1, 77]> inputs_115_cast_fp16 = clip(alpha = var_2085_to_fp16, beta = var_2084_to_fp16, x = inputs_113_cast_fp16)[name = tensor<string, []>("inputs_115_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_57_cast_fp16 = mul(x = inputs_115_cast_fp16, y = inputs_115_cast_fp16)[name = tensor<string, []>("inputs_sq_57_cast_fp16")];
            tensor<int32, [1]> var_2104 = const()[name = tensor<string, []>("op_2104"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_57_cast_fp16 = reduce_mean(axes = var_2104, keep_dims = var_2082, x = inputs_sq_57_cast_fp16)[name = tensor<string, []>("variance_57_cast_fp16")];
            tensor<fp16, []> var_2106_to_fp16 = const()[name = tensor<string, []>("op_2106_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_2107_cast_fp16 = add(x = variance_57_cast_fp16, y = var_2106_to_fp16)[name = tensor<string, []>("op_2107_cast_fp16")];
            tensor<fp16, []> var_2108_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_2108_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_2108_cast_fp16 = rsqrt(epsilon = var_2108_epsilon_0_to_fp16, x = var_2107_cast_fp16)[name = tensor<string, []>("op_2108_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_57_cast_fp16 = mul(x = inputs_115_cast_fp16, y = var_2108_cast_fp16)[name = tensor<string, []>("hidden_states_57_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_57_to_fp16 = const()[name = tensor<string, []>("w_57_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(5666481472)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_59_cast_fp16 = mul(x = w_57_to_fp16, y = hidden_states_57_cast_fp16)[name = tensor<string, []>("obj_59_cast_fp16")];
            tensor<int32, [2]> var_2122 = const()[name = tensor<string, []>("op_2122"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2124 = const()[name = tensor<string, []>("op_2124"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> query_29_pad_type_0 = const()[name = tensor<string, []>("query_29_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> query_29_pad_0 = const()[name = tensor<string, []>("query_29_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_14_layer_0_SelfAttention_q_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_14_layer_0_SelfAttention_q_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(5666489728)))];
            tensor<fp16, [1, 4096, 1, 77]> query_29_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_2124, groups = var_2083, pad = query_29_pad_0, pad_type = query_29_pad_type_0, strides = var_2122, weight = block_14_layer_0_SelfAttention_q_proj_weight_to_fp16, x = obj_59_cast_fp16)[name = tensor<string, []>("query_29_cast_fp16")];
            tensor<int32, [2]> var_2128 = const()[name = tensor<string, []>("op_2128"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2130 = const()[name = tensor<string, []>("op_2130"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> key_29_pad_type_0 = const()[name = tensor<string, []>("key_29_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> key_29_pad_0 = const()[name = tensor<string, []>("key_29_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_14_layer_0_SelfAttention_k_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_14_layer_0_SelfAttention_k_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(5700044224)))];
            tensor<fp16, [1, 4096, 1, 77]> key_29_cast_fp16 = conv(dilations = var_2130, groups = var_2083, pad = key_29_pad_0, pad_type = key_29_pad_type_0, strides = var_2128, weight = block_14_layer_0_SelfAttention_k_proj_weight_to_fp16, x = obj_59_cast_fp16)[name = tensor<string, []>("key_29_cast_fp16")];
            tensor<int32, [2]> var_2135 = const()[name = tensor<string, []>("op_2135"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2137 = const()[name = tensor<string, []>("op_2137"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> value_29_pad_type_0 = const()[name = tensor<string, []>("value_29_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> value_29_pad_0 = const()[name = tensor<string, []>("value_29_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_14_layer_0_SelfAttention_v_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_14_layer_0_SelfAttention_v_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(5733598720)))];
            tensor<fp16, [1, 4096, 1, 77]> value_29_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_2137, groups = var_2083, pad = value_29_pad_0, pad_type = value_29_pad_type_0, strides = var_2135, weight = block_14_layer_0_SelfAttention_v_proj_weight_to_fp16, x = obj_59_cast_fp16)[name = tensor<string, []>("value_29_cast_fp16")];
            tensor<int32, [4]> var_2141 = const()[name = tensor<string, []>("op_2141"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_2142_cast_fp16 = reshape(shape = var_2141, x = query_29_cast_fp16)[name = tensor<string, []>("op_2142_cast_fp16")];
            tensor<int32, [4]> var_2143 = const()[name = tensor<string, []>("op_2143"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_2144_cast_fp16 = reshape(shape = var_2143, x = key_29_cast_fp16)[name = tensor<string, []>("op_2144_cast_fp16")];
            tensor<bool, []> mh_w_85_transpose_x_0 = const()[name = tensor<string, []>("mh_w_85_transpose_x_0"), val = tensor<bool, []>(true)];
            tensor<bool, []> mh_w_85_transpose_y_0 = const()[name = tensor<string, []>("mh_w_85_transpose_y_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 77, 77]> mh_w_85_cast_fp16 = matmul(transpose_x = mh_w_85_transpose_x_0, transpose_y = mh_w_85_transpose_y_0, x = var_2142_cast_fp16, y = var_2144_cast_fp16)[name = tensor<string, []>("mh_w_85_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> mh_w_87_cast_fp16 = add(x = mh_w_85_cast_fp16, y = var_133_cast_fp16)[name = tensor<string, []>("mh_w_87_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> mh_w_89_cast_fp16 = add(x = mh_w_87_cast_fp16, y = relative_attention_bias_to_fp16)[name = tensor<string, []>("mh_w_89_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> var_2153_cast_fp16 = softmax(axis = var_2087, x = mh_w_89_cast_fp16)[name = tensor<string, []>("op_2153_cast_fp16")];
            tensor<int32, [4]> var_2154 = const()[name = tensor<string, []>("op_2154"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_2155_cast_fp16 = reshape(shape = var_2154, x = value_29_cast_fp16)[name = tensor<string, []>("op_2155_cast_fp16")];
            tensor<bool, []> attn_29_transpose_x_0 = const()[name = tensor<string, []>("attn_29_transpose_x_0"), val = tensor<bool, []>(false)];
            tensor<bool, []> attn_29_transpose_y_0 = const()[name = tensor<string, []>("attn_29_transpose_y_0"), val = tensor<bool, []>(true)];
            tensor<fp16, [1, 64, 64, 77]> attn_29_cast_fp16 = matmul(transpose_x = attn_29_transpose_x_0, transpose_y = attn_29_transpose_y_0, x = var_2155_cast_fp16, y = var_2153_cast_fp16)[name = tensor<string, []>("attn_29_cast_fp16")];
            tensor<int32, [4]> var_2158 = const()[name = tensor<string, []>("op_2158"), val = tensor<int32, [4]>([1, 4096, 1, -1])];
            tensor<fp16, [1, 4096, 1, 77]> input_85_cast_fp16 = reshape(shape = var_2158, x = attn_29_cast_fp16)[name = tensor<string, []>("input_85_cast_fp16")];
            tensor<int32, [2]> var_2162 = const()[name = tensor<string, []>("op_2162"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2164 = const()[name = tensor<string, []>("op_2164"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> obj_61_pad_type_0 = const()[name = tensor<string, []>("obj_61_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> obj_61_pad_0 = const()[name = tensor<string, []>("obj_61_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_14_layer_0_SelfAttention_o_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_14_layer_0_SelfAttention_o_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(5767153216)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_61_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_2164, groups = var_2083, pad = obj_61_pad_0, pad_type = obj_61_pad_type_0, strides = var_2162, weight = block_14_layer_0_SelfAttention_o_proj_weight_to_fp16, x = input_85_cast_fp16)[name = tensor<string, []>("obj_61_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_117_cast_fp16 = add(x = inputs_115_cast_fp16, y = obj_61_cast_fp16)[name = tensor<string, []>("inputs_117_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_119_cast_fp16 = clip(alpha = var_2085_to_fp16, beta = var_2084_to_fp16, x = inputs_117_cast_fp16)[name = tensor<string, []>("inputs_119_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_59_cast_fp16 = mul(x = inputs_119_cast_fp16, y = inputs_119_cast_fp16)[name = tensor<string, []>("inputs_sq_59_cast_fp16")];
            tensor<int32, [1]> var_2173 = const()[name = tensor<string, []>("op_2173"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_59_cast_fp16 = reduce_mean(axes = var_2173, keep_dims = var_2082, x = inputs_sq_59_cast_fp16)[name = tensor<string, []>("variance_59_cast_fp16")];
            tensor<fp16, []> var_2175_to_fp16 = const()[name = tensor<string, []>("op_2175_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_2176_cast_fp16 = add(x = variance_59_cast_fp16, y = var_2175_to_fp16)[name = tensor<string, []>("op_2176_cast_fp16")];
            tensor<fp16, []> var_2177_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_2177_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_2177_cast_fp16 = rsqrt(epsilon = var_2177_epsilon_0_to_fp16, x = var_2176_cast_fp16)[name = tensor<string, []>("op_2177_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_59_cast_fp16 = mul(x = inputs_119_cast_fp16, y = var_2177_cast_fp16)[name = tensor<string, []>("hidden_states_59_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_59_to_fp16 = const()[name = tensor<string, []>("w_59_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(5800707712)))];
            tensor<fp16, [1, 4096, 1, 77]> input_87_cast_fp16 = mul(x = w_59_to_fp16, y = hidden_states_59_cast_fp16)[name = tensor<string, []>("input_87_cast_fp16")];
            tensor<int32, [2]> var_2190 = const()[name = tensor<string, []>("op_2190"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2192 = const()[name = tensor<string, []>("op_2192"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> x_31_pad_type_0 = const()[name = tensor<string, []>("x_31_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> x_31_pad_0 = const()[name = tensor<string, []>("x_31_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_14_layer_1_DenseReluDense_wi_0_weight_to_fp16 = const()[name = tensor<string, []>("block_14_layer_1_DenseReluDense_wi_0_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(5800715968)))];
            tensor<fp16, [1, 10240, 1, 77]> x_31_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_2192, groups = var_2083, pad = x_31_pad_0, pad_type = x_31_pad_type_0, strides = var_2190, weight = block_14_layer_1_DenseReluDense_wi_0_weight_to_fp16, x = input_87_cast_fp16)[name = tensor<string, []>("x_31_cast_fp16")];
            tensor<string, []> var_2206_mode_0 = const()[name = tensor<string, []>("op_2206_mode_0"), val = tensor<string, []>("TANH_APPROXIMATION")];
            tensor<fp16, [1, 10240, 1, 77]> var_2206_cast_fp16 = gelu(mode = var_2206_mode_0, x = x_31_cast_fp16)[name = tensor<string, []>("op_2206_cast_fp16")];
            tensor<int32, [2]> var_2209 = const()[name = tensor<string, []>("op_2209"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2211 = const()[name = tensor<string, []>("op_2211"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_2213_pad_type_0 = const()[name = tensor<string, []>("op_2213_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_2213_pad_0 = const()[name = tensor<string, []>("op_2213_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_14_layer_1_DenseReluDense_wi_1_weight_to_fp16 = const()[name = tensor<string, []>("block_14_layer_1_DenseReluDense_wi_1_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(5884602112)))];
            tensor<fp16, [1, 10240, 1, 77]> var_2213_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_2211, groups = var_2083, pad = var_2213_pad_0, pad_type = var_2213_pad_type_0, strides = var_2209, weight = block_14_layer_1_DenseReluDense_wi_1_weight_to_fp16, x = input_87_cast_fp16)[name = tensor<string, []>("op_2213_cast_fp16")];
            tensor<fp16, [1, 10240, 1, 77]> input_89_cast_fp16 = mul(x = var_2206_cast_fp16, y = var_2213_cast_fp16)[name = tensor<string, []>("input_89_cast_fp16")];
            tensor<int32, [2]> var_2217 = const()[name = tensor<string, []>("op_2217"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2219 = const()[name = tensor<string, []>("op_2219"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_2221_pad_type_0 = const()[name = tensor<string, []>("op_2221_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_2221_pad_0 = const()[name = tensor<string, []>("op_2221_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 10240, 1, 1]> block_14_layer_1_DenseReluDense_wo_weight_to_fp16 = const()[name = tensor<string, []>("block_14_layer_1_DenseReluDense_wo_weight_to_fp16"), val = tensor<fp16, [4096, 10240, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(5968488256)))];
            tensor<fp16, [1, 4096, 1, 77]> var_2221_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_2219, groups = var_2083, pad = var_2221_pad_0, pad_type = var_2221_pad_type_0, strides = var_2217, weight = block_14_layer_1_DenseReluDense_wo_weight_to_fp16, x = input_89_cast_fp16)[name = tensor<string, []>("op_2221_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_121_cast_fp16 = add(x = inputs_119_cast_fp16, y = var_2221_cast_fp16)[name = tensor<string, []>("inputs_121_cast_fp16")];
            tensor<bool, []> var_2226 = const()[name = tensor<string, []>("op_2226"), val = tensor<bool, []>(true)];
            tensor<int32, []> var_2227 = const()[name = tensor<string, []>("op_2227"), val = tensor<int32, []>(1)];
            tensor<int32, []> var_2231 = const()[name = tensor<string, []>("op_2231"), val = tensor<int32, []>(3)];
            tensor<fp16, []> var_2229_to_fp16 = const()[name = tensor<string, []>("op_2229_to_fp16"), val = tensor<fp16, []>(-0x1.b18p+15)];
            tensor<fp16, []> var_2228_to_fp16 = const()[name = tensor<string, []>("op_2228_to_fp16"), val = tensor<fp16, []>(0x1.b18p+15)];
            tensor<fp16, [1, 4096, 1, 77]> inputs_123_cast_fp16 = clip(alpha = var_2229_to_fp16, beta = var_2228_to_fp16, x = inputs_121_cast_fp16)[name = tensor<string, []>("inputs_123_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_61_cast_fp16 = mul(x = inputs_123_cast_fp16, y = inputs_123_cast_fp16)[name = tensor<string, []>("inputs_sq_61_cast_fp16")];
            tensor<int32, [1]> var_2248 = const()[name = tensor<string, []>("op_2248"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_61_cast_fp16 = reduce_mean(axes = var_2248, keep_dims = var_2226, x = inputs_sq_61_cast_fp16)[name = tensor<string, []>("variance_61_cast_fp16")];
            tensor<fp16, []> var_2250_to_fp16 = const()[name = tensor<string, []>("op_2250_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_2251_cast_fp16 = add(x = variance_61_cast_fp16, y = var_2250_to_fp16)[name = tensor<string, []>("op_2251_cast_fp16")];
            tensor<fp16, []> var_2252_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_2252_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_2252_cast_fp16 = rsqrt(epsilon = var_2252_epsilon_0_to_fp16, x = var_2251_cast_fp16)[name = tensor<string, []>("op_2252_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_61_cast_fp16 = mul(x = inputs_123_cast_fp16, y = var_2252_cast_fp16)[name = tensor<string, []>("hidden_states_61_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_61_to_fp16 = const()[name = tensor<string, []>("w_61_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(6052374400)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_63_cast_fp16 = mul(x = w_61_to_fp16, y = hidden_states_61_cast_fp16)[name = tensor<string, []>("obj_63_cast_fp16")];
            tensor<int32, [2]> var_2266 = const()[name = tensor<string, []>("op_2266"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2268 = const()[name = tensor<string, []>("op_2268"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> query_31_pad_type_0 = const()[name = tensor<string, []>("query_31_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> query_31_pad_0 = const()[name = tensor<string, []>("query_31_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_15_layer_0_SelfAttention_q_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_15_layer_0_SelfAttention_q_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(6052382656)))];
            tensor<fp16, [1, 4096, 1, 77]> query_31_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_2268, groups = var_2227, pad = query_31_pad_0, pad_type = query_31_pad_type_0, strides = var_2266, weight = block_15_layer_0_SelfAttention_q_proj_weight_to_fp16, x = obj_63_cast_fp16)[name = tensor<string, []>("query_31_cast_fp16")];
            tensor<int32, [2]> var_2272 = const()[name = tensor<string, []>("op_2272"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2274 = const()[name = tensor<string, []>("op_2274"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> key_31_pad_type_0 = const()[name = tensor<string, []>("key_31_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> key_31_pad_0 = const()[name = tensor<string, []>("key_31_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_15_layer_0_SelfAttention_k_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_15_layer_0_SelfAttention_k_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(6085937152)))];
            tensor<fp16, [1, 4096, 1, 77]> key_31_cast_fp16 = conv(dilations = var_2274, groups = var_2227, pad = key_31_pad_0, pad_type = key_31_pad_type_0, strides = var_2272, weight = block_15_layer_0_SelfAttention_k_proj_weight_to_fp16, x = obj_63_cast_fp16)[name = tensor<string, []>("key_31_cast_fp16")];
            tensor<int32, [2]> var_2279 = const()[name = tensor<string, []>("op_2279"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2281 = const()[name = tensor<string, []>("op_2281"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> value_31_pad_type_0 = const()[name = tensor<string, []>("value_31_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> value_31_pad_0 = const()[name = tensor<string, []>("value_31_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_15_layer_0_SelfAttention_v_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_15_layer_0_SelfAttention_v_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(6119491648)))];
            tensor<fp16, [1, 4096, 1, 77]> value_31_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_2281, groups = var_2227, pad = value_31_pad_0, pad_type = value_31_pad_type_0, strides = var_2279, weight = block_15_layer_0_SelfAttention_v_proj_weight_to_fp16, x = obj_63_cast_fp16)[name = tensor<string, []>("value_31_cast_fp16")];
            tensor<int32, [4]> var_2285 = const()[name = tensor<string, []>("op_2285"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_2286_cast_fp16 = reshape(shape = var_2285, x = query_31_cast_fp16)[name = tensor<string, []>("op_2286_cast_fp16")];
            tensor<int32, [4]> var_2287 = const()[name = tensor<string, []>("op_2287"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_2288_cast_fp16 = reshape(shape = var_2287, x = key_31_cast_fp16)[name = tensor<string, []>("op_2288_cast_fp16")];
            tensor<bool, []> mh_w_91_transpose_x_0 = const()[name = tensor<string, []>("mh_w_91_transpose_x_0"), val = tensor<bool, []>(true)];
            tensor<bool, []> mh_w_91_transpose_y_0 = const()[name = tensor<string, []>("mh_w_91_transpose_y_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 77, 77]> mh_w_91_cast_fp16 = matmul(transpose_x = mh_w_91_transpose_x_0, transpose_y = mh_w_91_transpose_y_0, x = var_2286_cast_fp16, y = var_2288_cast_fp16)[name = tensor<string, []>("mh_w_91_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> mh_w_93_cast_fp16 = add(x = mh_w_91_cast_fp16, y = var_133_cast_fp16)[name = tensor<string, []>("mh_w_93_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> mh_w_95_cast_fp16 = add(x = mh_w_93_cast_fp16, y = relative_attention_bias_to_fp16)[name = tensor<string, []>("mh_w_95_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> var_2297_cast_fp16 = softmax(axis = var_2231, x = mh_w_95_cast_fp16)[name = tensor<string, []>("op_2297_cast_fp16")];
            tensor<int32, [4]> var_2298 = const()[name = tensor<string, []>("op_2298"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_2299_cast_fp16 = reshape(shape = var_2298, x = value_31_cast_fp16)[name = tensor<string, []>("op_2299_cast_fp16")];
            tensor<bool, []> attn_31_transpose_x_0 = const()[name = tensor<string, []>("attn_31_transpose_x_0"), val = tensor<bool, []>(false)];
            tensor<bool, []> attn_31_transpose_y_0 = const()[name = tensor<string, []>("attn_31_transpose_y_0"), val = tensor<bool, []>(true)];
            tensor<fp16, [1, 64, 64, 77]> attn_31_cast_fp16 = matmul(transpose_x = attn_31_transpose_x_0, transpose_y = attn_31_transpose_y_0, x = var_2299_cast_fp16, y = var_2297_cast_fp16)[name = tensor<string, []>("attn_31_cast_fp16")];
            tensor<int32, [4]> var_2302 = const()[name = tensor<string, []>("op_2302"), val = tensor<int32, [4]>([1, 4096, 1, -1])];
            tensor<fp16, [1, 4096, 1, 77]> input_91_cast_fp16 = reshape(shape = var_2302, x = attn_31_cast_fp16)[name = tensor<string, []>("input_91_cast_fp16")];
            tensor<int32, [2]> var_2306 = const()[name = tensor<string, []>("op_2306"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2308 = const()[name = tensor<string, []>("op_2308"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> obj_65_pad_type_0 = const()[name = tensor<string, []>("obj_65_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> obj_65_pad_0 = const()[name = tensor<string, []>("obj_65_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_15_layer_0_SelfAttention_o_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_15_layer_0_SelfAttention_o_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(6153046144)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_65_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_2308, groups = var_2227, pad = obj_65_pad_0, pad_type = obj_65_pad_type_0, strides = var_2306, weight = block_15_layer_0_SelfAttention_o_proj_weight_to_fp16, x = input_91_cast_fp16)[name = tensor<string, []>("obj_65_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_125_cast_fp16 = add(x = inputs_123_cast_fp16, y = obj_65_cast_fp16)[name = tensor<string, []>("inputs_125_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_127_cast_fp16 = clip(alpha = var_2229_to_fp16, beta = var_2228_to_fp16, x = inputs_125_cast_fp16)[name = tensor<string, []>("inputs_127_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_63_cast_fp16 = mul(x = inputs_127_cast_fp16, y = inputs_127_cast_fp16)[name = tensor<string, []>("inputs_sq_63_cast_fp16")];
            tensor<int32, [1]> var_2317 = const()[name = tensor<string, []>("op_2317"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_63_cast_fp16 = reduce_mean(axes = var_2317, keep_dims = var_2226, x = inputs_sq_63_cast_fp16)[name = tensor<string, []>("variance_63_cast_fp16")];
            tensor<fp16, []> var_2319_to_fp16 = const()[name = tensor<string, []>("op_2319_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_2320_cast_fp16 = add(x = variance_63_cast_fp16, y = var_2319_to_fp16)[name = tensor<string, []>("op_2320_cast_fp16")];
            tensor<fp16, []> var_2321_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_2321_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_2321_cast_fp16 = rsqrt(epsilon = var_2321_epsilon_0_to_fp16, x = var_2320_cast_fp16)[name = tensor<string, []>("op_2321_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_63_cast_fp16 = mul(x = inputs_127_cast_fp16, y = var_2321_cast_fp16)[name = tensor<string, []>("hidden_states_63_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_63_to_fp16 = const()[name = tensor<string, []>("w_63_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(6186600640)))];
            tensor<fp16, [1, 4096, 1, 77]> input_93_cast_fp16 = mul(x = w_63_to_fp16, y = hidden_states_63_cast_fp16)[name = tensor<string, []>("input_93_cast_fp16")];
            tensor<int32, [2]> var_2334 = const()[name = tensor<string, []>("op_2334"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2336 = const()[name = tensor<string, []>("op_2336"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> x_33_pad_type_0 = const()[name = tensor<string, []>("x_33_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> x_33_pad_0 = const()[name = tensor<string, []>("x_33_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_15_layer_1_DenseReluDense_wi_0_weight_to_fp16 = const()[name = tensor<string, []>("block_15_layer_1_DenseReluDense_wi_0_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(6186608896)))];
            tensor<fp16, [1, 10240, 1, 77]> x_33_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_2336, groups = var_2227, pad = x_33_pad_0, pad_type = x_33_pad_type_0, strides = var_2334, weight = block_15_layer_1_DenseReluDense_wi_0_weight_to_fp16, x = input_93_cast_fp16)[name = tensor<string, []>("x_33_cast_fp16")];
            tensor<string, []> var_2350_mode_0 = const()[name = tensor<string, []>("op_2350_mode_0"), val = tensor<string, []>("TANH_APPROXIMATION")];
            tensor<fp16, [1, 10240, 1, 77]> var_2350_cast_fp16 = gelu(mode = var_2350_mode_0, x = x_33_cast_fp16)[name = tensor<string, []>("op_2350_cast_fp16")];
            tensor<int32, [2]> var_2353 = const()[name = tensor<string, []>("op_2353"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2355 = const()[name = tensor<string, []>("op_2355"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_2357_pad_type_0 = const()[name = tensor<string, []>("op_2357_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_2357_pad_0 = const()[name = tensor<string, []>("op_2357_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_15_layer_1_DenseReluDense_wi_1_weight_to_fp16 = const()[name = tensor<string, []>("block_15_layer_1_DenseReluDense_wi_1_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(6270495040)))];
            tensor<fp16, [1, 10240, 1, 77]> var_2357_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_2355, groups = var_2227, pad = var_2357_pad_0, pad_type = var_2357_pad_type_0, strides = var_2353, weight = block_15_layer_1_DenseReluDense_wi_1_weight_to_fp16, x = input_93_cast_fp16)[name = tensor<string, []>("op_2357_cast_fp16")];
            tensor<fp16, [1, 10240, 1, 77]> input_95_cast_fp16 = mul(x = var_2350_cast_fp16, y = var_2357_cast_fp16)[name = tensor<string, []>("input_95_cast_fp16")];
            tensor<int32, [2]> var_2361 = const()[name = tensor<string, []>("op_2361"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2363 = const()[name = tensor<string, []>("op_2363"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_2365_pad_type_0 = const()[name = tensor<string, []>("op_2365_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_2365_pad_0 = const()[name = tensor<string, []>("op_2365_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 10240, 1, 1]> block_15_layer_1_DenseReluDense_wo_weight_to_fp16 = const()[name = tensor<string, []>("block_15_layer_1_DenseReluDense_wo_weight_to_fp16"), val = tensor<fp16, [4096, 10240, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(6354381184)))];
            tensor<fp16, [1, 4096, 1, 77]> var_2365_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_2363, groups = var_2227, pad = var_2365_pad_0, pad_type = var_2365_pad_type_0, strides = var_2361, weight = block_15_layer_1_DenseReluDense_wo_weight_to_fp16, x = input_95_cast_fp16)[name = tensor<string, []>("op_2365_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_129_cast_fp16 = add(x = inputs_127_cast_fp16, y = var_2365_cast_fp16)[name = tensor<string, []>("inputs_129_cast_fp16")];
            tensor<bool, []> var_2370 = const()[name = tensor<string, []>("op_2370"), val = tensor<bool, []>(true)];
            tensor<int32, []> var_2371 = const()[name = tensor<string, []>("op_2371"), val = tensor<int32, []>(1)];
            tensor<int32, []> var_2375 = const()[name = tensor<string, []>("op_2375"), val = tensor<int32, []>(3)];
            tensor<fp16, []> var_2373_to_fp16 = const()[name = tensor<string, []>("op_2373_to_fp16"), val = tensor<fp16, []>(-0x1.b18p+15)];
            tensor<fp16, []> var_2372_to_fp16 = const()[name = tensor<string, []>("op_2372_to_fp16"), val = tensor<fp16, []>(0x1.b18p+15)];
            tensor<fp16, [1, 4096, 1, 77]> inputs_131_cast_fp16 = clip(alpha = var_2373_to_fp16, beta = var_2372_to_fp16, x = inputs_129_cast_fp16)[name = tensor<string, []>("inputs_131_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_65_cast_fp16 = mul(x = inputs_131_cast_fp16, y = inputs_131_cast_fp16)[name = tensor<string, []>("inputs_sq_65_cast_fp16")];
            tensor<int32, [1]> var_2392 = const()[name = tensor<string, []>("op_2392"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_65_cast_fp16 = reduce_mean(axes = var_2392, keep_dims = var_2370, x = inputs_sq_65_cast_fp16)[name = tensor<string, []>("variance_65_cast_fp16")];
            tensor<fp16, []> var_2394_to_fp16 = const()[name = tensor<string, []>("op_2394_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_2395_cast_fp16 = add(x = variance_65_cast_fp16, y = var_2394_to_fp16)[name = tensor<string, []>("op_2395_cast_fp16")];
            tensor<fp16, []> var_2396_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_2396_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_2396_cast_fp16 = rsqrt(epsilon = var_2396_epsilon_0_to_fp16, x = var_2395_cast_fp16)[name = tensor<string, []>("op_2396_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_65_cast_fp16 = mul(x = inputs_131_cast_fp16, y = var_2396_cast_fp16)[name = tensor<string, []>("hidden_states_65_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_65_to_fp16 = const()[name = tensor<string, []>("w_65_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(6438267328)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_67_cast_fp16 = mul(x = w_65_to_fp16, y = hidden_states_65_cast_fp16)[name = tensor<string, []>("obj_67_cast_fp16")];
            tensor<int32, [2]> var_2410 = const()[name = tensor<string, []>("op_2410"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2412 = const()[name = tensor<string, []>("op_2412"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> query_33_pad_type_0 = const()[name = tensor<string, []>("query_33_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> query_33_pad_0 = const()[name = tensor<string, []>("query_33_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_16_layer_0_SelfAttention_q_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_16_layer_0_SelfAttention_q_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(6438275584)))];
            tensor<fp16, [1, 4096, 1, 77]> query_33_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_2412, groups = var_2371, pad = query_33_pad_0, pad_type = query_33_pad_type_0, strides = var_2410, weight = block_16_layer_0_SelfAttention_q_proj_weight_to_fp16, x = obj_67_cast_fp16)[name = tensor<string, []>("query_33_cast_fp16")];
            tensor<int32, [2]> var_2416 = const()[name = tensor<string, []>("op_2416"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2418 = const()[name = tensor<string, []>("op_2418"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> key_33_pad_type_0 = const()[name = tensor<string, []>("key_33_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> key_33_pad_0 = const()[name = tensor<string, []>("key_33_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_16_layer_0_SelfAttention_k_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_16_layer_0_SelfAttention_k_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(6471830080)))];
            tensor<fp16, [1, 4096, 1, 77]> key_33_cast_fp16 = conv(dilations = var_2418, groups = var_2371, pad = key_33_pad_0, pad_type = key_33_pad_type_0, strides = var_2416, weight = block_16_layer_0_SelfAttention_k_proj_weight_to_fp16, x = obj_67_cast_fp16)[name = tensor<string, []>("key_33_cast_fp16")];
            tensor<int32, [2]> var_2423 = const()[name = tensor<string, []>("op_2423"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2425 = const()[name = tensor<string, []>("op_2425"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> value_33_pad_type_0 = const()[name = tensor<string, []>("value_33_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> value_33_pad_0 = const()[name = tensor<string, []>("value_33_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_16_layer_0_SelfAttention_v_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_16_layer_0_SelfAttention_v_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(6505384576)))];
            tensor<fp16, [1, 4096, 1, 77]> value_33_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_2425, groups = var_2371, pad = value_33_pad_0, pad_type = value_33_pad_type_0, strides = var_2423, weight = block_16_layer_0_SelfAttention_v_proj_weight_to_fp16, x = obj_67_cast_fp16)[name = tensor<string, []>("value_33_cast_fp16")];
            tensor<int32, [4]> var_2429 = const()[name = tensor<string, []>("op_2429"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_2430_cast_fp16 = reshape(shape = var_2429, x = query_33_cast_fp16)[name = tensor<string, []>("op_2430_cast_fp16")];
            tensor<int32, [4]> var_2431 = const()[name = tensor<string, []>("op_2431"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_2432_cast_fp16 = reshape(shape = var_2431, x = key_33_cast_fp16)[name = tensor<string, []>("op_2432_cast_fp16")];
            tensor<bool, []> mh_w_97_transpose_x_0 = const()[name = tensor<string, []>("mh_w_97_transpose_x_0"), val = tensor<bool, []>(true)];
            tensor<bool, []> mh_w_97_transpose_y_0 = const()[name = tensor<string, []>("mh_w_97_transpose_y_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 77, 77]> mh_w_97_cast_fp16 = matmul(transpose_x = mh_w_97_transpose_x_0, transpose_y = mh_w_97_transpose_y_0, x = var_2430_cast_fp16, y = var_2432_cast_fp16)[name = tensor<string, []>("mh_w_97_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> mh_w_99_cast_fp16 = add(x = mh_w_97_cast_fp16, y = var_133_cast_fp16)[name = tensor<string, []>("mh_w_99_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> mh_w_101_cast_fp16 = add(x = mh_w_99_cast_fp16, y = relative_attention_bias_to_fp16)[name = tensor<string, []>("mh_w_101_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> var_2441_cast_fp16 = softmax(axis = var_2375, x = mh_w_101_cast_fp16)[name = tensor<string, []>("op_2441_cast_fp16")];
            tensor<int32, [4]> var_2442 = const()[name = tensor<string, []>("op_2442"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_2443_cast_fp16 = reshape(shape = var_2442, x = value_33_cast_fp16)[name = tensor<string, []>("op_2443_cast_fp16")];
            tensor<bool, []> attn_33_transpose_x_0 = const()[name = tensor<string, []>("attn_33_transpose_x_0"), val = tensor<bool, []>(false)];
            tensor<bool, []> attn_33_transpose_y_0 = const()[name = tensor<string, []>("attn_33_transpose_y_0"), val = tensor<bool, []>(true)];
            tensor<fp16, [1, 64, 64, 77]> attn_33_cast_fp16 = matmul(transpose_x = attn_33_transpose_x_0, transpose_y = attn_33_transpose_y_0, x = var_2443_cast_fp16, y = var_2441_cast_fp16)[name = tensor<string, []>("attn_33_cast_fp16")];
            tensor<int32, [4]> var_2446 = const()[name = tensor<string, []>("op_2446"), val = tensor<int32, [4]>([1, 4096, 1, -1])];
            tensor<fp16, [1, 4096, 1, 77]> input_97_cast_fp16 = reshape(shape = var_2446, x = attn_33_cast_fp16)[name = tensor<string, []>("input_97_cast_fp16")];
            tensor<int32, [2]> var_2450 = const()[name = tensor<string, []>("op_2450"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2452 = const()[name = tensor<string, []>("op_2452"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> obj_69_pad_type_0 = const()[name = tensor<string, []>("obj_69_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> obj_69_pad_0 = const()[name = tensor<string, []>("obj_69_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_16_layer_0_SelfAttention_o_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_16_layer_0_SelfAttention_o_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(6538939072)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_69_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_2452, groups = var_2371, pad = obj_69_pad_0, pad_type = obj_69_pad_type_0, strides = var_2450, weight = block_16_layer_0_SelfAttention_o_proj_weight_to_fp16, x = input_97_cast_fp16)[name = tensor<string, []>("obj_69_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_133_cast_fp16 = add(x = inputs_131_cast_fp16, y = obj_69_cast_fp16)[name = tensor<string, []>("inputs_133_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_135_cast_fp16 = clip(alpha = var_2373_to_fp16, beta = var_2372_to_fp16, x = inputs_133_cast_fp16)[name = tensor<string, []>("inputs_135_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_67_cast_fp16 = mul(x = inputs_135_cast_fp16, y = inputs_135_cast_fp16)[name = tensor<string, []>("inputs_sq_67_cast_fp16")];
            tensor<int32, [1]> var_2461 = const()[name = tensor<string, []>("op_2461"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_67_cast_fp16 = reduce_mean(axes = var_2461, keep_dims = var_2370, x = inputs_sq_67_cast_fp16)[name = tensor<string, []>("variance_67_cast_fp16")];
            tensor<fp16, []> var_2463_to_fp16 = const()[name = tensor<string, []>("op_2463_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_2464_cast_fp16 = add(x = variance_67_cast_fp16, y = var_2463_to_fp16)[name = tensor<string, []>("op_2464_cast_fp16")];
            tensor<fp16, []> var_2465_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_2465_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_2465_cast_fp16 = rsqrt(epsilon = var_2465_epsilon_0_to_fp16, x = var_2464_cast_fp16)[name = tensor<string, []>("op_2465_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_67_cast_fp16 = mul(x = inputs_135_cast_fp16, y = var_2465_cast_fp16)[name = tensor<string, []>("hidden_states_67_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_67_to_fp16 = const()[name = tensor<string, []>("w_67_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(6572493568)))];
            tensor<fp16, [1, 4096, 1, 77]> input_99_cast_fp16 = mul(x = w_67_to_fp16, y = hidden_states_67_cast_fp16)[name = tensor<string, []>("input_99_cast_fp16")];
            tensor<int32, [2]> var_2478 = const()[name = tensor<string, []>("op_2478"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2480 = const()[name = tensor<string, []>("op_2480"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> x_35_pad_type_0 = const()[name = tensor<string, []>("x_35_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> x_35_pad_0 = const()[name = tensor<string, []>("x_35_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_16_layer_1_DenseReluDense_wi_0_weight_to_fp16 = const()[name = tensor<string, []>("block_16_layer_1_DenseReluDense_wi_0_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(6572501824)))];
            tensor<fp16, [1, 10240, 1, 77]> x_35_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_2480, groups = var_2371, pad = x_35_pad_0, pad_type = x_35_pad_type_0, strides = var_2478, weight = block_16_layer_1_DenseReluDense_wi_0_weight_to_fp16, x = input_99_cast_fp16)[name = tensor<string, []>("x_35_cast_fp16")];
            tensor<string, []> var_2494_mode_0 = const()[name = tensor<string, []>("op_2494_mode_0"), val = tensor<string, []>("TANH_APPROXIMATION")];
            tensor<fp16, [1, 10240, 1, 77]> var_2494_cast_fp16 = gelu(mode = var_2494_mode_0, x = x_35_cast_fp16)[name = tensor<string, []>("op_2494_cast_fp16")];
            tensor<int32, [2]> var_2497 = const()[name = tensor<string, []>("op_2497"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2499 = const()[name = tensor<string, []>("op_2499"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_2501_pad_type_0 = const()[name = tensor<string, []>("op_2501_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_2501_pad_0 = const()[name = tensor<string, []>("op_2501_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_16_layer_1_DenseReluDense_wi_1_weight_to_fp16 = const()[name = tensor<string, []>("block_16_layer_1_DenseReluDense_wi_1_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(6656387968)))];
            tensor<fp16, [1, 10240, 1, 77]> var_2501_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_2499, groups = var_2371, pad = var_2501_pad_0, pad_type = var_2501_pad_type_0, strides = var_2497, weight = block_16_layer_1_DenseReluDense_wi_1_weight_to_fp16, x = input_99_cast_fp16)[name = tensor<string, []>("op_2501_cast_fp16")];
            tensor<fp16, [1, 10240, 1, 77]> input_101_cast_fp16 = mul(x = var_2494_cast_fp16, y = var_2501_cast_fp16)[name = tensor<string, []>("input_101_cast_fp16")];
            tensor<int32, [2]> var_2505 = const()[name = tensor<string, []>("op_2505"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2507 = const()[name = tensor<string, []>("op_2507"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_2509_pad_type_0 = const()[name = tensor<string, []>("op_2509_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_2509_pad_0 = const()[name = tensor<string, []>("op_2509_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 10240, 1, 1]> block_16_layer_1_DenseReluDense_wo_weight_to_fp16 = const()[name = tensor<string, []>("block_16_layer_1_DenseReluDense_wo_weight_to_fp16"), val = tensor<fp16, [4096, 10240, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(6740274112)))];
            tensor<fp16, [1, 4096, 1, 77]> var_2509_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_2507, groups = var_2371, pad = var_2509_pad_0, pad_type = var_2509_pad_type_0, strides = var_2505, weight = block_16_layer_1_DenseReluDense_wo_weight_to_fp16, x = input_101_cast_fp16)[name = tensor<string, []>("op_2509_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_137_cast_fp16 = add(x = inputs_135_cast_fp16, y = var_2509_cast_fp16)[name = tensor<string, []>("inputs_137_cast_fp16")];
            tensor<bool, []> var_2514 = const()[name = tensor<string, []>("op_2514"), val = tensor<bool, []>(true)];
            tensor<int32, []> var_2515 = const()[name = tensor<string, []>("op_2515"), val = tensor<int32, []>(1)];
            tensor<int32, []> var_2519 = const()[name = tensor<string, []>("op_2519"), val = tensor<int32, []>(3)];
            tensor<fp16, []> var_2517_to_fp16 = const()[name = tensor<string, []>("op_2517_to_fp16"), val = tensor<fp16, []>(-0x1.b18p+15)];
            tensor<fp16, []> var_2516_to_fp16 = const()[name = tensor<string, []>("op_2516_to_fp16"), val = tensor<fp16, []>(0x1.b18p+15)];
            tensor<fp16, [1, 4096, 1, 77]> inputs_139_cast_fp16 = clip(alpha = var_2517_to_fp16, beta = var_2516_to_fp16, x = inputs_137_cast_fp16)[name = tensor<string, []>("inputs_139_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_69_cast_fp16 = mul(x = inputs_139_cast_fp16, y = inputs_139_cast_fp16)[name = tensor<string, []>("inputs_sq_69_cast_fp16")];
            tensor<int32, [1]> var_2536 = const()[name = tensor<string, []>("op_2536"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_69_cast_fp16 = reduce_mean(axes = var_2536, keep_dims = var_2514, x = inputs_sq_69_cast_fp16)[name = tensor<string, []>("variance_69_cast_fp16")];
            tensor<fp16, []> var_2538_to_fp16 = const()[name = tensor<string, []>("op_2538_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_2539_cast_fp16 = add(x = variance_69_cast_fp16, y = var_2538_to_fp16)[name = tensor<string, []>("op_2539_cast_fp16")];
            tensor<fp16, []> var_2540_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_2540_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_2540_cast_fp16 = rsqrt(epsilon = var_2540_epsilon_0_to_fp16, x = var_2539_cast_fp16)[name = tensor<string, []>("op_2540_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_69_cast_fp16 = mul(x = inputs_139_cast_fp16, y = var_2540_cast_fp16)[name = tensor<string, []>("hidden_states_69_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_69_to_fp16 = const()[name = tensor<string, []>("w_69_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(6824160256)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_71_cast_fp16 = mul(x = w_69_to_fp16, y = hidden_states_69_cast_fp16)[name = tensor<string, []>("obj_71_cast_fp16")];
            tensor<int32, [2]> var_2554 = const()[name = tensor<string, []>("op_2554"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2556 = const()[name = tensor<string, []>("op_2556"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> query_35_pad_type_0 = const()[name = tensor<string, []>("query_35_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> query_35_pad_0 = const()[name = tensor<string, []>("query_35_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_17_layer_0_SelfAttention_q_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_17_layer_0_SelfAttention_q_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(6824168512)))];
            tensor<fp16, [1, 4096, 1, 77]> query_35_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_2556, groups = var_2515, pad = query_35_pad_0, pad_type = query_35_pad_type_0, strides = var_2554, weight = block_17_layer_0_SelfAttention_q_proj_weight_to_fp16, x = obj_71_cast_fp16)[name = tensor<string, []>("query_35_cast_fp16")];
            tensor<int32, [2]> var_2560 = const()[name = tensor<string, []>("op_2560"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2562 = const()[name = tensor<string, []>("op_2562"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> key_35_pad_type_0 = const()[name = tensor<string, []>("key_35_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> key_35_pad_0 = const()[name = tensor<string, []>("key_35_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_17_layer_0_SelfAttention_k_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_17_layer_0_SelfAttention_k_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(6857723008)))];
            tensor<fp16, [1, 4096, 1, 77]> key_35_cast_fp16 = conv(dilations = var_2562, groups = var_2515, pad = key_35_pad_0, pad_type = key_35_pad_type_0, strides = var_2560, weight = block_17_layer_0_SelfAttention_k_proj_weight_to_fp16, x = obj_71_cast_fp16)[name = tensor<string, []>("key_35_cast_fp16")];
            tensor<int32, [2]> var_2567 = const()[name = tensor<string, []>("op_2567"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2569 = const()[name = tensor<string, []>("op_2569"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> value_35_pad_type_0 = const()[name = tensor<string, []>("value_35_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> value_35_pad_0 = const()[name = tensor<string, []>("value_35_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_17_layer_0_SelfAttention_v_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_17_layer_0_SelfAttention_v_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(6891277504)))];
            tensor<fp16, [1, 4096, 1, 77]> value_35_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_2569, groups = var_2515, pad = value_35_pad_0, pad_type = value_35_pad_type_0, strides = var_2567, weight = block_17_layer_0_SelfAttention_v_proj_weight_to_fp16, x = obj_71_cast_fp16)[name = tensor<string, []>("value_35_cast_fp16")];
            tensor<int32, [4]> var_2573 = const()[name = tensor<string, []>("op_2573"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_2574_cast_fp16 = reshape(shape = var_2573, x = query_35_cast_fp16)[name = tensor<string, []>("op_2574_cast_fp16")];
            tensor<int32, [4]> var_2575 = const()[name = tensor<string, []>("op_2575"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_2576_cast_fp16 = reshape(shape = var_2575, x = key_35_cast_fp16)[name = tensor<string, []>("op_2576_cast_fp16")];
            tensor<bool, []> mh_w_103_transpose_x_0 = const()[name = tensor<string, []>("mh_w_103_transpose_x_0"), val = tensor<bool, []>(true)];
            tensor<bool, []> mh_w_103_transpose_y_0 = const()[name = tensor<string, []>("mh_w_103_transpose_y_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 77, 77]> mh_w_103_cast_fp16 = matmul(transpose_x = mh_w_103_transpose_x_0, transpose_y = mh_w_103_transpose_y_0, x = var_2574_cast_fp16, y = var_2576_cast_fp16)[name = tensor<string, []>("mh_w_103_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> mh_w_105_cast_fp16 = add(x = mh_w_103_cast_fp16, y = var_133_cast_fp16)[name = tensor<string, []>("mh_w_105_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> mh_w_107_cast_fp16 = add(x = mh_w_105_cast_fp16, y = relative_attention_bias_to_fp16)[name = tensor<string, []>("mh_w_107_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> var_2585_cast_fp16 = softmax(axis = var_2519, x = mh_w_107_cast_fp16)[name = tensor<string, []>("op_2585_cast_fp16")];
            tensor<int32, [4]> var_2586 = const()[name = tensor<string, []>("op_2586"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_2587_cast_fp16 = reshape(shape = var_2586, x = value_35_cast_fp16)[name = tensor<string, []>("op_2587_cast_fp16")];
            tensor<bool, []> attn_35_transpose_x_0 = const()[name = tensor<string, []>("attn_35_transpose_x_0"), val = tensor<bool, []>(false)];
            tensor<bool, []> attn_35_transpose_y_0 = const()[name = tensor<string, []>("attn_35_transpose_y_0"), val = tensor<bool, []>(true)];
            tensor<fp16, [1, 64, 64, 77]> attn_35_cast_fp16 = matmul(transpose_x = attn_35_transpose_x_0, transpose_y = attn_35_transpose_y_0, x = var_2587_cast_fp16, y = var_2585_cast_fp16)[name = tensor<string, []>("attn_35_cast_fp16")];
            tensor<int32, [4]> var_2590 = const()[name = tensor<string, []>("op_2590"), val = tensor<int32, [4]>([1, 4096, 1, -1])];
            tensor<fp16, [1, 4096, 1, 77]> input_103_cast_fp16 = reshape(shape = var_2590, x = attn_35_cast_fp16)[name = tensor<string, []>("input_103_cast_fp16")];
            tensor<int32, [2]> var_2594 = const()[name = tensor<string, []>("op_2594"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2596 = const()[name = tensor<string, []>("op_2596"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> obj_73_pad_type_0 = const()[name = tensor<string, []>("obj_73_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> obj_73_pad_0 = const()[name = tensor<string, []>("obj_73_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_17_layer_0_SelfAttention_o_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_17_layer_0_SelfAttention_o_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(6924832000)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_73_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_2596, groups = var_2515, pad = obj_73_pad_0, pad_type = obj_73_pad_type_0, strides = var_2594, weight = block_17_layer_0_SelfAttention_o_proj_weight_to_fp16, x = input_103_cast_fp16)[name = tensor<string, []>("obj_73_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_141_cast_fp16 = add(x = inputs_139_cast_fp16, y = obj_73_cast_fp16)[name = tensor<string, []>("inputs_141_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_143_cast_fp16 = clip(alpha = var_2517_to_fp16, beta = var_2516_to_fp16, x = inputs_141_cast_fp16)[name = tensor<string, []>("inputs_143_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_71_cast_fp16 = mul(x = inputs_143_cast_fp16, y = inputs_143_cast_fp16)[name = tensor<string, []>("inputs_sq_71_cast_fp16")];
            tensor<int32, [1]> var_2605 = const()[name = tensor<string, []>("op_2605"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_71_cast_fp16 = reduce_mean(axes = var_2605, keep_dims = var_2514, x = inputs_sq_71_cast_fp16)[name = tensor<string, []>("variance_71_cast_fp16")];
            tensor<fp16, []> var_2607_to_fp16 = const()[name = tensor<string, []>("op_2607_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_2608_cast_fp16 = add(x = variance_71_cast_fp16, y = var_2607_to_fp16)[name = tensor<string, []>("op_2608_cast_fp16")];
            tensor<fp16, []> var_2609_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_2609_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_2609_cast_fp16 = rsqrt(epsilon = var_2609_epsilon_0_to_fp16, x = var_2608_cast_fp16)[name = tensor<string, []>("op_2609_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_71_cast_fp16 = mul(x = inputs_143_cast_fp16, y = var_2609_cast_fp16)[name = tensor<string, []>("hidden_states_71_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_71_to_fp16 = const()[name = tensor<string, []>("w_71_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(6958386496)))];
            tensor<fp16, [1, 4096, 1, 77]> input_105_cast_fp16 = mul(x = w_71_to_fp16, y = hidden_states_71_cast_fp16)[name = tensor<string, []>("input_105_cast_fp16")];
            tensor<int32, [2]> var_2622 = const()[name = tensor<string, []>("op_2622"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2624 = const()[name = tensor<string, []>("op_2624"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> x_37_pad_type_0 = const()[name = tensor<string, []>("x_37_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> x_37_pad_0 = const()[name = tensor<string, []>("x_37_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_17_layer_1_DenseReluDense_wi_0_weight_to_fp16 = const()[name = tensor<string, []>("block_17_layer_1_DenseReluDense_wi_0_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(6958394752)))];
            tensor<fp16, [1, 10240, 1, 77]> x_37_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_2624, groups = var_2515, pad = x_37_pad_0, pad_type = x_37_pad_type_0, strides = var_2622, weight = block_17_layer_1_DenseReluDense_wi_0_weight_to_fp16, x = input_105_cast_fp16)[name = tensor<string, []>("x_37_cast_fp16")];
            tensor<string, []> var_2638_mode_0 = const()[name = tensor<string, []>("op_2638_mode_0"), val = tensor<string, []>("TANH_APPROXIMATION")];
            tensor<fp16, [1, 10240, 1, 77]> var_2638_cast_fp16 = gelu(mode = var_2638_mode_0, x = x_37_cast_fp16)[name = tensor<string, []>("op_2638_cast_fp16")];
            tensor<int32, [2]> var_2641 = const()[name = tensor<string, []>("op_2641"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2643 = const()[name = tensor<string, []>("op_2643"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_2645_pad_type_0 = const()[name = tensor<string, []>("op_2645_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_2645_pad_0 = const()[name = tensor<string, []>("op_2645_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_17_layer_1_DenseReluDense_wi_1_weight_to_fp16 = const()[name = tensor<string, []>("block_17_layer_1_DenseReluDense_wi_1_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(7042280896)))];
            tensor<fp16, [1, 10240, 1, 77]> var_2645_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_2643, groups = var_2515, pad = var_2645_pad_0, pad_type = var_2645_pad_type_0, strides = var_2641, weight = block_17_layer_1_DenseReluDense_wi_1_weight_to_fp16, x = input_105_cast_fp16)[name = tensor<string, []>("op_2645_cast_fp16")];
            tensor<fp16, [1, 10240, 1, 77]> input_107_cast_fp16 = mul(x = var_2638_cast_fp16, y = var_2645_cast_fp16)[name = tensor<string, []>("input_107_cast_fp16")];
            tensor<int32, [2]> var_2649 = const()[name = tensor<string, []>("op_2649"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2651 = const()[name = tensor<string, []>("op_2651"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_2653_pad_type_0 = const()[name = tensor<string, []>("op_2653_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_2653_pad_0 = const()[name = tensor<string, []>("op_2653_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 10240, 1, 1]> block_17_layer_1_DenseReluDense_wo_weight_to_fp16 = const()[name = tensor<string, []>("block_17_layer_1_DenseReluDense_wo_weight_to_fp16"), val = tensor<fp16, [4096, 10240, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(7126167040)))];
            tensor<fp16, [1, 4096, 1, 77]> var_2653_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_2651, groups = var_2515, pad = var_2653_pad_0, pad_type = var_2653_pad_type_0, strides = var_2649, weight = block_17_layer_1_DenseReluDense_wo_weight_to_fp16, x = input_107_cast_fp16)[name = tensor<string, []>("op_2653_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_145_cast_fp16 = add(x = inputs_143_cast_fp16, y = var_2653_cast_fp16)[name = tensor<string, []>("inputs_145_cast_fp16")];
            tensor<bool, []> var_2658 = const()[name = tensor<string, []>("op_2658"), val = tensor<bool, []>(true)];
            tensor<int32, []> var_2659 = const()[name = tensor<string, []>("op_2659"), val = tensor<int32, []>(1)];
            tensor<int32, []> var_2663 = const()[name = tensor<string, []>("op_2663"), val = tensor<int32, []>(3)];
            tensor<fp16, []> var_2661_to_fp16 = const()[name = tensor<string, []>("op_2661_to_fp16"), val = tensor<fp16, []>(-0x1.b18p+15)];
            tensor<fp16, []> var_2660_to_fp16 = const()[name = tensor<string, []>("op_2660_to_fp16"), val = tensor<fp16, []>(0x1.b18p+15)];
            tensor<fp16, [1, 4096, 1, 77]> inputs_147_cast_fp16 = clip(alpha = var_2661_to_fp16, beta = var_2660_to_fp16, x = inputs_145_cast_fp16)[name = tensor<string, []>("inputs_147_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_73_cast_fp16 = mul(x = inputs_147_cast_fp16, y = inputs_147_cast_fp16)[name = tensor<string, []>("inputs_sq_73_cast_fp16")];
            tensor<int32, [1]> var_2680 = const()[name = tensor<string, []>("op_2680"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_73_cast_fp16 = reduce_mean(axes = var_2680, keep_dims = var_2658, x = inputs_sq_73_cast_fp16)[name = tensor<string, []>("variance_73_cast_fp16")];
            tensor<fp16, []> var_2682_to_fp16 = const()[name = tensor<string, []>("op_2682_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_2683_cast_fp16 = add(x = variance_73_cast_fp16, y = var_2682_to_fp16)[name = tensor<string, []>("op_2683_cast_fp16")];
            tensor<fp16, []> var_2684_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_2684_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_2684_cast_fp16 = rsqrt(epsilon = var_2684_epsilon_0_to_fp16, x = var_2683_cast_fp16)[name = tensor<string, []>("op_2684_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_73_cast_fp16 = mul(x = inputs_147_cast_fp16, y = var_2684_cast_fp16)[name = tensor<string, []>("hidden_states_73_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_73_to_fp16 = const()[name = tensor<string, []>("w_73_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(7210053184)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_75_cast_fp16 = mul(x = w_73_to_fp16, y = hidden_states_73_cast_fp16)[name = tensor<string, []>("obj_75_cast_fp16")];
            tensor<int32, [2]> var_2698 = const()[name = tensor<string, []>("op_2698"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2700 = const()[name = tensor<string, []>("op_2700"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> query_37_pad_type_0 = const()[name = tensor<string, []>("query_37_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> query_37_pad_0 = const()[name = tensor<string, []>("query_37_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_18_layer_0_SelfAttention_q_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_18_layer_0_SelfAttention_q_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(7210061440)))];
            tensor<fp16, [1, 4096, 1, 77]> query_37_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_2700, groups = var_2659, pad = query_37_pad_0, pad_type = query_37_pad_type_0, strides = var_2698, weight = block_18_layer_0_SelfAttention_q_proj_weight_to_fp16, x = obj_75_cast_fp16)[name = tensor<string, []>("query_37_cast_fp16")];
            tensor<int32, [2]> var_2704 = const()[name = tensor<string, []>("op_2704"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2706 = const()[name = tensor<string, []>("op_2706"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> key_37_pad_type_0 = const()[name = tensor<string, []>("key_37_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> key_37_pad_0 = const()[name = tensor<string, []>("key_37_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_18_layer_0_SelfAttention_k_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_18_layer_0_SelfAttention_k_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(7243615936)))];
            tensor<fp16, [1, 4096, 1, 77]> key_37_cast_fp16 = conv(dilations = var_2706, groups = var_2659, pad = key_37_pad_0, pad_type = key_37_pad_type_0, strides = var_2704, weight = block_18_layer_0_SelfAttention_k_proj_weight_to_fp16, x = obj_75_cast_fp16)[name = tensor<string, []>("key_37_cast_fp16")];
            tensor<int32, [2]> var_2711 = const()[name = tensor<string, []>("op_2711"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2713 = const()[name = tensor<string, []>("op_2713"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> value_37_pad_type_0 = const()[name = tensor<string, []>("value_37_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> value_37_pad_0 = const()[name = tensor<string, []>("value_37_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_18_layer_0_SelfAttention_v_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_18_layer_0_SelfAttention_v_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(7277170432)))];
            tensor<fp16, [1, 4096, 1, 77]> value_37_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_2713, groups = var_2659, pad = value_37_pad_0, pad_type = value_37_pad_type_0, strides = var_2711, weight = block_18_layer_0_SelfAttention_v_proj_weight_to_fp16, x = obj_75_cast_fp16)[name = tensor<string, []>("value_37_cast_fp16")];
            tensor<int32, [4]> var_2717 = const()[name = tensor<string, []>("op_2717"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_2718_cast_fp16 = reshape(shape = var_2717, x = query_37_cast_fp16)[name = tensor<string, []>("op_2718_cast_fp16")];
            tensor<int32, [4]> var_2719 = const()[name = tensor<string, []>("op_2719"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_2720_cast_fp16 = reshape(shape = var_2719, x = key_37_cast_fp16)[name = tensor<string, []>("op_2720_cast_fp16")];
            tensor<bool, []> mh_w_109_transpose_x_0 = const()[name = tensor<string, []>("mh_w_109_transpose_x_0"), val = tensor<bool, []>(true)];
            tensor<bool, []> mh_w_109_transpose_y_0 = const()[name = tensor<string, []>("mh_w_109_transpose_y_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 77, 77]> mh_w_109_cast_fp16 = matmul(transpose_x = mh_w_109_transpose_x_0, transpose_y = mh_w_109_transpose_y_0, x = var_2718_cast_fp16, y = var_2720_cast_fp16)[name = tensor<string, []>("mh_w_109_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> mh_w_111_cast_fp16 = add(x = mh_w_109_cast_fp16, y = var_133_cast_fp16)[name = tensor<string, []>("mh_w_111_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> mh_w_113_cast_fp16 = add(x = mh_w_111_cast_fp16, y = relative_attention_bias_to_fp16)[name = tensor<string, []>("mh_w_113_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> var_2729_cast_fp16 = softmax(axis = var_2663, x = mh_w_113_cast_fp16)[name = tensor<string, []>("op_2729_cast_fp16")];
            tensor<int32, [4]> var_2730 = const()[name = tensor<string, []>("op_2730"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_2731_cast_fp16 = reshape(shape = var_2730, x = value_37_cast_fp16)[name = tensor<string, []>("op_2731_cast_fp16")];
            tensor<bool, []> attn_37_transpose_x_0 = const()[name = tensor<string, []>("attn_37_transpose_x_0"), val = tensor<bool, []>(false)];
            tensor<bool, []> attn_37_transpose_y_0 = const()[name = tensor<string, []>("attn_37_transpose_y_0"), val = tensor<bool, []>(true)];
            tensor<fp16, [1, 64, 64, 77]> attn_37_cast_fp16 = matmul(transpose_x = attn_37_transpose_x_0, transpose_y = attn_37_transpose_y_0, x = var_2731_cast_fp16, y = var_2729_cast_fp16)[name = tensor<string, []>("attn_37_cast_fp16")];
            tensor<int32, [4]> var_2734 = const()[name = tensor<string, []>("op_2734"), val = tensor<int32, [4]>([1, 4096, 1, -1])];
            tensor<fp16, [1, 4096, 1, 77]> input_109_cast_fp16 = reshape(shape = var_2734, x = attn_37_cast_fp16)[name = tensor<string, []>("input_109_cast_fp16")];
            tensor<int32, [2]> var_2738 = const()[name = tensor<string, []>("op_2738"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2740 = const()[name = tensor<string, []>("op_2740"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> obj_77_pad_type_0 = const()[name = tensor<string, []>("obj_77_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> obj_77_pad_0 = const()[name = tensor<string, []>("obj_77_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_18_layer_0_SelfAttention_o_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_18_layer_0_SelfAttention_o_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(7310724928)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_77_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_2740, groups = var_2659, pad = obj_77_pad_0, pad_type = obj_77_pad_type_0, strides = var_2738, weight = block_18_layer_0_SelfAttention_o_proj_weight_to_fp16, x = input_109_cast_fp16)[name = tensor<string, []>("obj_77_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_149_cast_fp16 = add(x = inputs_147_cast_fp16, y = obj_77_cast_fp16)[name = tensor<string, []>("inputs_149_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_151_cast_fp16 = clip(alpha = var_2661_to_fp16, beta = var_2660_to_fp16, x = inputs_149_cast_fp16)[name = tensor<string, []>("inputs_151_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_75_cast_fp16 = mul(x = inputs_151_cast_fp16, y = inputs_151_cast_fp16)[name = tensor<string, []>("inputs_sq_75_cast_fp16")];
            tensor<int32, [1]> var_2749 = const()[name = tensor<string, []>("op_2749"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_75_cast_fp16 = reduce_mean(axes = var_2749, keep_dims = var_2658, x = inputs_sq_75_cast_fp16)[name = tensor<string, []>("variance_75_cast_fp16")];
            tensor<fp16, []> var_2751_to_fp16 = const()[name = tensor<string, []>("op_2751_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_2752_cast_fp16 = add(x = variance_75_cast_fp16, y = var_2751_to_fp16)[name = tensor<string, []>("op_2752_cast_fp16")];
            tensor<fp16, []> var_2753_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_2753_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_2753_cast_fp16 = rsqrt(epsilon = var_2753_epsilon_0_to_fp16, x = var_2752_cast_fp16)[name = tensor<string, []>("op_2753_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_75_cast_fp16 = mul(x = inputs_151_cast_fp16, y = var_2753_cast_fp16)[name = tensor<string, []>("hidden_states_75_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_75_to_fp16 = const()[name = tensor<string, []>("w_75_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(7344279424)))];
            tensor<fp16, [1, 4096, 1, 77]> input_111_cast_fp16 = mul(x = w_75_to_fp16, y = hidden_states_75_cast_fp16)[name = tensor<string, []>("input_111_cast_fp16")];
            tensor<int32, [2]> var_2766 = const()[name = tensor<string, []>("op_2766"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2768 = const()[name = tensor<string, []>("op_2768"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> x_39_pad_type_0 = const()[name = tensor<string, []>("x_39_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> x_39_pad_0 = const()[name = tensor<string, []>("x_39_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_18_layer_1_DenseReluDense_wi_0_weight_to_fp16 = const()[name = tensor<string, []>("block_18_layer_1_DenseReluDense_wi_0_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(7344287680)))];
            tensor<fp16, [1, 10240, 1, 77]> x_39_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_2768, groups = var_2659, pad = x_39_pad_0, pad_type = x_39_pad_type_0, strides = var_2766, weight = block_18_layer_1_DenseReluDense_wi_0_weight_to_fp16, x = input_111_cast_fp16)[name = tensor<string, []>("x_39_cast_fp16")];
            tensor<string, []> var_2782_mode_0 = const()[name = tensor<string, []>("op_2782_mode_0"), val = tensor<string, []>("TANH_APPROXIMATION")];
            tensor<fp16, [1, 10240, 1, 77]> var_2782_cast_fp16 = gelu(mode = var_2782_mode_0, x = x_39_cast_fp16)[name = tensor<string, []>("op_2782_cast_fp16")];
            tensor<int32, [2]> var_2785 = const()[name = tensor<string, []>("op_2785"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2787 = const()[name = tensor<string, []>("op_2787"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_2789_pad_type_0 = const()[name = tensor<string, []>("op_2789_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_2789_pad_0 = const()[name = tensor<string, []>("op_2789_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_18_layer_1_DenseReluDense_wi_1_weight_to_fp16 = const()[name = tensor<string, []>("block_18_layer_1_DenseReluDense_wi_1_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(7428173824)))];
            tensor<fp16, [1, 10240, 1, 77]> var_2789_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_2787, groups = var_2659, pad = var_2789_pad_0, pad_type = var_2789_pad_type_0, strides = var_2785, weight = block_18_layer_1_DenseReluDense_wi_1_weight_to_fp16, x = input_111_cast_fp16)[name = tensor<string, []>("op_2789_cast_fp16")];
            tensor<fp16, [1, 10240, 1, 77]> input_113_cast_fp16 = mul(x = var_2782_cast_fp16, y = var_2789_cast_fp16)[name = tensor<string, []>("input_113_cast_fp16")];
            tensor<int32, [2]> var_2793 = const()[name = tensor<string, []>("op_2793"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2795 = const()[name = tensor<string, []>("op_2795"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_2797_pad_type_0 = const()[name = tensor<string, []>("op_2797_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_2797_pad_0 = const()[name = tensor<string, []>("op_2797_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 10240, 1, 1]> block_18_layer_1_DenseReluDense_wo_weight_to_fp16 = const()[name = tensor<string, []>("block_18_layer_1_DenseReluDense_wo_weight_to_fp16"), val = tensor<fp16, [4096, 10240, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(7512059968)))];
            tensor<fp16, [1, 4096, 1, 77]> var_2797_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_2795, groups = var_2659, pad = var_2797_pad_0, pad_type = var_2797_pad_type_0, strides = var_2793, weight = block_18_layer_1_DenseReluDense_wo_weight_to_fp16, x = input_113_cast_fp16)[name = tensor<string, []>("op_2797_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_153_cast_fp16 = add(x = inputs_151_cast_fp16, y = var_2797_cast_fp16)[name = tensor<string, []>("inputs_153_cast_fp16")];
            tensor<bool, []> var_2802 = const()[name = tensor<string, []>("op_2802"), val = tensor<bool, []>(true)];
            tensor<int32, []> var_2803 = const()[name = tensor<string, []>("op_2803"), val = tensor<int32, []>(1)];
            tensor<int32, []> var_2807 = const()[name = tensor<string, []>("op_2807"), val = tensor<int32, []>(3)];
            tensor<fp16, []> var_2805_to_fp16 = const()[name = tensor<string, []>("op_2805_to_fp16"), val = tensor<fp16, []>(-0x1.b18p+15)];
            tensor<fp16, []> var_2804_to_fp16 = const()[name = tensor<string, []>("op_2804_to_fp16"), val = tensor<fp16, []>(0x1.b18p+15)];
            tensor<fp16, [1, 4096, 1, 77]> inputs_155_cast_fp16 = clip(alpha = var_2805_to_fp16, beta = var_2804_to_fp16, x = inputs_153_cast_fp16)[name = tensor<string, []>("inputs_155_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_77_cast_fp16 = mul(x = inputs_155_cast_fp16, y = inputs_155_cast_fp16)[name = tensor<string, []>("inputs_sq_77_cast_fp16")];
            tensor<int32, [1]> var_2824 = const()[name = tensor<string, []>("op_2824"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_77_cast_fp16 = reduce_mean(axes = var_2824, keep_dims = var_2802, x = inputs_sq_77_cast_fp16)[name = tensor<string, []>("variance_77_cast_fp16")];
            tensor<fp16, []> var_2826_to_fp16 = const()[name = tensor<string, []>("op_2826_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_2827_cast_fp16 = add(x = variance_77_cast_fp16, y = var_2826_to_fp16)[name = tensor<string, []>("op_2827_cast_fp16")];
            tensor<fp16, []> var_2828_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_2828_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_2828_cast_fp16 = rsqrt(epsilon = var_2828_epsilon_0_to_fp16, x = var_2827_cast_fp16)[name = tensor<string, []>("op_2828_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_77_cast_fp16 = mul(x = inputs_155_cast_fp16, y = var_2828_cast_fp16)[name = tensor<string, []>("hidden_states_77_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_77_to_fp16 = const()[name = tensor<string, []>("w_77_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(7595946112)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_79_cast_fp16 = mul(x = w_77_to_fp16, y = hidden_states_77_cast_fp16)[name = tensor<string, []>("obj_79_cast_fp16")];
            tensor<int32, [2]> var_2842 = const()[name = tensor<string, []>("op_2842"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2844 = const()[name = tensor<string, []>("op_2844"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> query_39_pad_type_0 = const()[name = tensor<string, []>("query_39_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> query_39_pad_0 = const()[name = tensor<string, []>("query_39_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_19_layer_0_SelfAttention_q_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_19_layer_0_SelfAttention_q_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(7595954368)))];
            tensor<fp16, [1, 4096, 1, 77]> query_39_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_2844, groups = var_2803, pad = query_39_pad_0, pad_type = query_39_pad_type_0, strides = var_2842, weight = block_19_layer_0_SelfAttention_q_proj_weight_to_fp16, x = obj_79_cast_fp16)[name = tensor<string, []>("query_39_cast_fp16")];
            tensor<int32, [2]> var_2848 = const()[name = tensor<string, []>("op_2848"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2850 = const()[name = tensor<string, []>("op_2850"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> key_39_pad_type_0 = const()[name = tensor<string, []>("key_39_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> key_39_pad_0 = const()[name = tensor<string, []>("key_39_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_19_layer_0_SelfAttention_k_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_19_layer_0_SelfAttention_k_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(7629508864)))];
            tensor<fp16, [1, 4096, 1, 77]> key_39_cast_fp16 = conv(dilations = var_2850, groups = var_2803, pad = key_39_pad_0, pad_type = key_39_pad_type_0, strides = var_2848, weight = block_19_layer_0_SelfAttention_k_proj_weight_to_fp16, x = obj_79_cast_fp16)[name = tensor<string, []>("key_39_cast_fp16")];
            tensor<int32, [2]> var_2855 = const()[name = tensor<string, []>("op_2855"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2857 = const()[name = tensor<string, []>("op_2857"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> value_39_pad_type_0 = const()[name = tensor<string, []>("value_39_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> value_39_pad_0 = const()[name = tensor<string, []>("value_39_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_19_layer_0_SelfAttention_v_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_19_layer_0_SelfAttention_v_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(7663063360)))];
            tensor<fp16, [1, 4096, 1, 77]> value_39_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_2857, groups = var_2803, pad = value_39_pad_0, pad_type = value_39_pad_type_0, strides = var_2855, weight = block_19_layer_0_SelfAttention_v_proj_weight_to_fp16, x = obj_79_cast_fp16)[name = tensor<string, []>("value_39_cast_fp16")];
            tensor<int32, [4]> var_2861 = const()[name = tensor<string, []>("op_2861"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_2862_cast_fp16 = reshape(shape = var_2861, x = query_39_cast_fp16)[name = tensor<string, []>("op_2862_cast_fp16")];
            tensor<int32, [4]> var_2863 = const()[name = tensor<string, []>("op_2863"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_2864_cast_fp16 = reshape(shape = var_2863, x = key_39_cast_fp16)[name = tensor<string, []>("op_2864_cast_fp16")];
            tensor<bool, []> mh_w_115_transpose_x_0 = const()[name = tensor<string, []>("mh_w_115_transpose_x_0"), val = tensor<bool, []>(true)];
            tensor<bool, []> mh_w_115_transpose_y_0 = const()[name = tensor<string, []>("mh_w_115_transpose_y_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 77, 77]> mh_w_115_cast_fp16 = matmul(transpose_x = mh_w_115_transpose_x_0, transpose_y = mh_w_115_transpose_y_0, x = var_2862_cast_fp16, y = var_2864_cast_fp16)[name = tensor<string, []>("mh_w_115_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> mh_w_117_cast_fp16 = add(x = mh_w_115_cast_fp16, y = var_133_cast_fp16)[name = tensor<string, []>("mh_w_117_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> mh_w_119_cast_fp16 = add(x = mh_w_117_cast_fp16, y = relative_attention_bias_to_fp16)[name = tensor<string, []>("mh_w_119_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> var_2873_cast_fp16 = softmax(axis = var_2807, x = mh_w_119_cast_fp16)[name = tensor<string, []>("op_2873_cast_fp16")];
            tensor<int32, [4]> var_2874 = const()[name = tensor<string, []>("op_2874"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_2875_cast_fp16 = reshape(shape = var_2874, x = value_39_cast_fp16)[name = tensor<string, []>("op_2875_cast_fp16")];
            tensor<bool, []> attn_39_transpose_x_0 = const()[name = tensor<string, []>("attn_39_transpose_x_0"), val = tensor<bool, []>(false)];
            tensor<bool, []> attn_39_transpose_y_0 = const()[name = tensor<string, []>("attn_39_transpose_y_0"), val = tensor<bool, []>(true)];
            tensor<fp16, [1, 64, 64, 77]> attn_39_cast_fp16 = matmul(transpose_x = attn_39_transpose_x_0, transpose_y = attn_39_transpose_y_0, x = var_2875_cast_fp16, y = var_2873_cast_fp16)[name = tensor<string, []>("attn_39_cast_fp16")];
            tensor<int32, [4]> var_2878 = const()[name = tensor<string, []>("op_2878"), val = tensor<int32, [4]>([1, 4096, 1, -1])];
            tensor<fp16, [1, 4096, 1, 77]> input_115_cast_fp16 = reshape(shape = var_2878, x = attn_39_cast_fp16)[name = tensor<string, []>("input_115_cast_fp16")];
            tensor<int32, [2]> var_2882 = const()[name = tensor<string, []>("op_2882"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2884 = const()[name = tensor<string, []>("op_2884"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> obj_81_pad_type_0 = const()[name = tensor<string, []>("obj_81_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> obj_81_pad_0 = const()[name = tensor<string, []>("obj_81_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_19_layer_0_SelfAttention_o_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_19_layer_0_SelfAttention_o_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(7696617856)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_81_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_2884, groups = var_2803, pad = obj_81_pad_0, pad_type = obj_81_pad_type_0, strides = var_2882, weight = block_19_layer_0_SelfAttention_o_proj_weight_to_fp16, x = input_115_cast_fp16)[name = tensor<string, []>("obj_81_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_157_cast_fp16 = add(x = inputs_155_cast_fp16, y = obj_81_cast_fp16)[name = tensor<string, []>("inputs_157_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_159_cast_fp16 = clip(alpha = var_2805_to_fp16, beta = var_2804_to_fp16, x = inputs_157_cast_fp16)[name = tensor<string, []>("inputs_159_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_79_cast_fp16 = mul(x = inputs_159_cast_fp16, y = inputs_159_cast_fp16)[name = tensor<string, []>("inputs_sq_79_cast_fp16")];
            tensor<int32, [1]> var_2893 = const()[name = tensor<string, []>("op_2893"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_79_cast_fp16 = reduce_mean(axes = var_2893, keep_dims = var_2802, x = inputs_sq_79_cast_fp16)[name = tensor<string, []>("variance_79_cast_fp16")];
            tensor<fp16, []> var_2895_to_fp16 = const()[name = tensor<string, []>("op_2895_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_2896_cast_fp16 = add(x = variance_79_cast_fp16, y = var_2895_to_fp16)[name = tensor<string, []>("op_2896_cast_fp16")];
            tensor<fp16, []> var_2897_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_2897_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_2897_cast_fp16 = rsqrt(epsilon = var_2897_epsilon_0_to_fp16, x = var_2896_cast_fp16)[name = tensor<string, []>("op_2897_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_79_cast_fp16 = mul(x = inputs_159_cast_fp16, y = var_2897_cast_fp16)[name = tensor<string, []>("hidden_states_79_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_79_to_fp16 = const()[name = tensor<string, []>("w_79_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(7730172352)))];
            tensor<fp16, [1, 4096, 1, 77]> input_117_cast_fp16 = mul(x = w_79_to_fp16, y = hidden_states_79_cast_fp16)[name = tensor<string, []>("input_117_cast_fp16")];
            tensor<int32, [2]> var_2910 = const()[name = tensor<string, []>("op_2910"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2912 = const()[name = tensor<string, []>("op_2912"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> x_41_pad_type_0 = const()[name = tensor<string, []>("x_41_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> x_41_pad_0 = const()[name = tensor<string, []>("x_41_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_19_layer_1_DenseReluDense_wi_0_weight_to_fp16 = const()[name = tensor<string, []>("block_19_layer_1_DenseReluDense_wi_0_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(7730180608)))];
            tensor<fp16, [1, 10240, 1, 77]> x_41_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_2912, groups = var_2803, pad = x_41_pad_0, pad_type = x_41_pad_type_0, strides = var_2910, weight = block_19_layer_1_DenseReluDense_wi_0_weight_to_fp16, x = input_117_cast_fp16)[name = tensor<string, []>("x_41_cast_fp16")];
            tensor<string, []> var_2926_mode_0 = const()[name = tensor<string, []>("op_2926_mode_0"), val = tensor<string, []>("TANH_APPROXIMATION")];
            tensor<fp16, [1, 10240, 1, 77]> var_2926_cast_fp16 = gelu(mode = var_2926_mode_0, x = x_41_cast_fp16)[name = tensor<string, []>("op_2926_cast_fp16")];
            tensor<int32, [2]> var_2929 = const()[name = tensor<string, []>("op_2929"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2931 = const()[name = tensor<string, []>("op_2931"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_2933_pad_type_0 = const()[name = tensor<string, []>("op_2933_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_2933_pad_0 = const()[name = tensor<string, []>("op_2933_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_19_layer_1_DenseReluDense_wi_1_weight_to_fp16 = const()[name = tensor<string, []>("block_19_layer_1_DenseReluDense_wi_1_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(7814066752)))];
            tensor<fp16, [1, 10240, 1, 77]> var_2933_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_2931, groups = var_2803, pad = var_2933_pad_0, pad_type = var_2933_pad_type_0, strides = var_2929, weight = block_19_layer_1_DenseReluDense_wi_1_weight_to_fp16, x = input_117_cast_fp16)[name = tensor<string, []>("op_2933_cast_fp16")];
            tensor<fp16, [1, 10240, 1, 77]> input_119_cast_fp16 = mul(x = var_2926_cast_fp16, y = var_2933_cast_fp16)[name = tensor<string, []>("input_119_cast_fp16")];
            tensor<int32, [2]> var_2937 = const()[name = tensor<string, []>("op_2937"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2939 = const()[name = tensor<string, []>("op_2939"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_2941_pad_type_0 = const()[name = tensor<string, []>("op_2941_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_2941_pad_0 = const()[name = tensor<string, []>("op_2941_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 10240, 1, 1]> block_19_layer_1_DenseReluDense_wo_weight_to_fp16 = const()[name = tensor<string, []>("block_19_layer_1_DenseReluDense_wo_weight_to_fp16"), val = tensor<fp16, [4096, 10240, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(7897952896)))];
            tensor<fp16, [1, 4096, 1, 77]> var_2941_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_2939, groups = var_2803, pad = var_2941_pad_0, pad_type = var_2941_pad_type_0, strides = var_2937, weight = block_19_layer_1_DenseReluDense_wo_weight_to_fp16, x = input_119_cast_fp16)[name = tensor<string, []>("op_2941_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_161_cast_fp16 = add(x = inputs_159_cast_fp16, y = var_2941_cast_fp16)[name = tensor<string, []>("inputs_161_cast_fp16")];
            tensor<bool, []> var_2946 = const()[name = tensor<string, []>("op_2946"), val = tensor<bool, []>(true)];
            tensor<int32, []> var_2947 = const()[name = tensor<string, []>("op_2947"), val = tensor<int32, []>(1)];
            tensor<int32, []> var_2951 = const()[name = tensor<string, []>("op_2951"), val = tensor<int32, []>(3)];
            tensor<fp16, []> var_2949_to_fp16 = const()[name = tensor<string, []>("op_2949_to_fp16"), val = tensor<fp16, []>(-0x1.b18p+15)];
            tensor<fp16, []> var_2948_to_fp16 = const()[name = tensor<string, []>("op_2948_to_fp16"), val = tensor<fp16, []>(0x1.b18p+15)];
            tensor<fp16, [1, 4096, 1, 77]> inputs_163_cast_fp16 = clip(alpha = var_2949_to_fp16, beta = var_2948_to_fp16, x = inputs_161_cast_fp16)[name = tensor<string, []>("inputs_163_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_81_cast_fp16 = mul(x = inputs_163_cast_fp16, y = inputs_163_cast_fp16)[name = tensor<string, []>("inputs_sq_81_cast_fp16")];
            tensor<int32, [1]> var_2968 = const()[name = tensor<string, []>("op_2968"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_81_cast_fp16 = reduce_mean(axes = var_2968, keep_dims = var_2946, x = inputs_sq_81_cast_fp16)[name = tensor<string, []>("variance_81_cast_fp16")];
            tensor<fp16, []> var_2970_to_fp16 = const()[name = tensor<string, []>("op_2970_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_2971_cast_fp16 = add(x = variance_81_cast_fp16, y = var_2970_to_fp16)[name = tensor<string, []>("op_2971_cast_fp16")];
            tensor<fp16, []> var_2972_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_2972_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_2972_cast_fp16 = rsqrt(epsilon = var_2972_epsilon_0_to_fp16, x = var_2971_cast_fp16)[name = tensor<string, []>("op_2972_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_81_cast_fp16 = mul(x = inputs_163_cast_fp16, y = var_2972_cast_fp16)[name = tensor<string, []>("hidden_states_81_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_81_to_fp16 = const()[name = tensor<string, []>("w_81_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(7981839040)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_83_cast_fp16 = mul(x = w_81_to_fp16, y = hidden_states_81_cast_fp16)[name = tensor<string, []>("obj_83_cast_fp16")];
            tensor<int32, [2]> var_2986 = const()[name = tensor<string, []>("op_2986"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2988 = const()[name = tensor<string, []>("op_2988"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> query_41_pad_type_0 = const()[name = tensor<string, []>("query_41_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> query_41_pad_0 = const()[name = tensor<string, []>("query_41_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_20_layer_0_SelfAttention_q_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_20_layer_0_SelfAttention_q_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(7981847296)))];
            tensor<fp16, [1, 4096, 1, 77]> query_41_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_2988, groups = var_2947, pad = query_41_pad_0, pad_type = query_41_pad_type_0, strides = var_2986, weight = block_20_layer_0_SelfAttention_q_proj_weight_to_fp16, x = obj_83_cast_fp16)[name = tensor<string, []>("query_41_cast_fp16")];
            tensor<int32, [2]> var_2992 = const()[name = tensor<string, []>("op_2992"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2994 = const()[name = tensor<string, []>("op_2994"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> key_41_pad_type_0 = const()[name = tensor<string, []>("key_41_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> key_41_pad_0 = const()[name = tensor<string, []>("key_41_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_20_layer_0_SelfAttention_k_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_20_layer_0_SelfAttention_k_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(8015401792)))];
            tensor<fp16, [1, 4096, 1, 77]> key_41_cast_fp16 = conv(dilations = var_2994, groups = var_2947, pad = key_41_pad_0, pad_type = key_41_pad_type_0, strides = var_2992, weight = block_20_layer_0_SelfAttention_k_proj_weight_to_fp16, x = obj_83_cast_fp16)[name = tensor<string, []>("key_41_cast_fp16")];
            tensor<int32, [2]> var_2999 = const()[name = tensor<string, []>("op_2999"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_3001 = const()[name = tensor<string, []>("op_3001"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> value_41_pad_type_0 = const()[name = tensor<string, []>("value_41_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> value_41_pad_0 = const()[name = tensor<string, []>("value_41_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_20_layer_0_SelfAttention_v_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_20_layer_0_SelfAttention_v_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(8048956288)))];
            tensor<fp16, [1, 4096, 1, 77]> value_41_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_3001, groups = var_2947, pad = value_41_pad_0, pad_type = value_41_pad_type_0, strides = var_2999, weight = block_20_layer_0_SelfAttention_v_proj_weight_to_fp16, x = obj_83_cast_fp16)[name = tensor<string, []>("value_41_cast_fp16")];
            tensor<int32, [4]> var_3005 = const()[name = tensor<string, []>("op_3005"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_3006_cast_fp16 = reshape(shape = var_3005, x = query_41_cast_fp16)[name = tensor<string, []>("op_3006_cast_fp16")];
            tensor<int32, [4]> var_3007 = const()[name = tensor<string, []>("op_3007"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_3008_cast_fp16 = reshape(shape = var_3007, x = key_41_cast_fp16)[name = tensor<string, []>("op_3008_cast_fp16")];
            tensor<bool, []> mh_w_121_transpose_x_0 = const()[name = tensor<string, []>("mh_w_121_transpose_x_0"), val = tensor<bool, []>(true)];
            tensor<bool, []> mh_w_121_transpose_y_0 = const()[name = tensor<string, []>("mh_w_121_transpose_y_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 77, 77]> mh_w_121_cast_fp16 = matmul(transpose_x = mh_w_121_transpose_x_0, transpose_y = mh_w_121_transpose_y_0, x = var_3006_cast_fp16, y = var_3008_cast_fp16)[name = tensor<string, []>("mh_w_121_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> mh_w_123_cast_fp16 = add(x = mh_w_121_cast_fp16, y = var_133_cast_fp16)[name = tensor<string, []>("mh_w_123_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> mh_w_125_cast_fp16 = add(x = mh_w_123_cast_fp16, y = relative_attention_bias_to_fp16)[name = tensor<string, []>("mh_w_125_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> var_3017_cast_fp16 = softmax(axis = var_2951, x = mh_w_125_cast_fp16)[name = tensor<string, []>("op_3017_cast_fp16")];
            tensor<int32, [4]> var_3018 = const()[name = tensor<string, []>("op_3018"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_3019_cast_fp16 = reshape(shape = var_3018, x = value_41_cast_fp16)[name = tensor<string, []>("op_3019_cast_fp16")];
            tensor<bool, []> attn_41_transpose_x_0 = const()[name = tensor<string, []>("attn_41_transpose_x_0"), val = tensor<bool, []>(false)];
            tensor<bool, []> attn_41_transpose_y_0 = const()[name = tensor<string, []>("attn_41_transpose_y_0"), val = tensor<bool, []>(true)];
            tensor<fp16, [1, 64, 64, 77]> attn_41_cast_fp16 = matmul(transpose_x = attn_41_transpose_x_0, transpose_y = attn_41_transpose_y_0, x = var_3019_cast_fp16, y = var_3017_cast_fp16)[name = tensor<string, []>("attn_41_cast_fp16")];
            tensor<int32, [4]> var_3022 = const()[name = tensor<string, []>("op_3022"), val = tensor<int32, [4]>([1, 4096, 1, -1])];
            tensor<fp16, [1, 4096, 1, 77]> input_121_cast_fp16 = reshape(shape = var_3022, x = attn_41_cast_fp16)[name = tensor<string, []>("input_121_cast_fp16")];
            tensor<int32, [2]> var_3026 = const()[name = tensor<string, []>("op_3026"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_3028 = const()[name = tensor<string, []>("op_3028"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> obj_85_pad_type_0 = const()[name = tensor<string, []>("obj_85_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> obj_85_pad_0 = const()[name = tensor<string, []>("obj_85_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_20_layer_0_SelfAttention_o_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_20_layer_0_SelfAttention_o_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(8082510784)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_85_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_3028, groups = var_2947, pad = obj_85_pad_0, pad_type = obj_85_pad_type_0, strides = var_3026, weight = block_20_layer_0_SelfAttention_o_proj_weight_to_fp16, x = input_121_cast_fp16)[name = tensor<string, []>("obj_85_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_165_cast_fp16 = add(x = inputs_163_cast_fp16, y = obj_85_cast_fp16)[name = tensor<string, []>("inputs_165_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_167_cast_fp16 = clip(alpha = var_2949_to_fp16, beta = var_2948_to_fp16, x = inputs_165_cast_fp16)[name = tensor<string, []>("inputs_167_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_83_cast_fp16 = mul(x = inputs_167_cast_fp16, y = inputs_167_cast_fp16)[name = tensor<string, []>("inputs_sq_83_cast_fp16")];
            tensor<int32, [1]> var_3037 = const()[name = tensor<string, []>("op_3037"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_83_cast_fp16 = reduce_mean(axes = var_3037, keep_dims = var_2946, x = inputs_sq_83_cast_fp16)[name = tensor<string, []>("variance_83_cast_fp16")];
            tensor<fp16, []> var_3039_to_fp16 = const()[name = tensor<string, []>("op_3039_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_3040_cast_fp16 = add(x = variance_83_cast_fp16, y = var_3039_to_fp16)[name = tensor<string, []>("op_3040_cast_fp16")];
            tensor<fp16, []> var_3041_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_3041_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_3041_cast_fp16 = rsqrt(epsilon = var_3041_epsilon_0_to_fp16, x = var_3040_cast_fp16)[name = tensor<string, []>("op_3041_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_83_cast_fp16 = mul(x = inputs_167_cast_fp16, y = var_3041_cast_fp16)[name = tensor<string, []>("hidden_states_83_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_83_to_fp16 = const()[name = tensor<string, []>("w_83_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(8116065280)))];
            tensor<fp16, [1, 4096, 1, 77]> input_123_cast_fp16 = mul(x = w_83_to_fp16, y = hidden_states_83_cast_fp16)[name = tensor<string, []>("input_123_cast_fp16")];
            tensor<int32, [2]> var_3054 = const()[name = tensor<string, []>("op_3054"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_3056 = const()[name = tensor<string, []>("op_3056"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> x_43_pad_type_0 = const()[name = tensor<string, []>("x_43_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> x_43_pad_0 = const()[name = tensor<string, []>("x_43_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_20_layer_1_DenseReluDense_wi_0_weight_to_fp16 = const()[name = tensor<string, []>("block_20_layer_1_DenseReluDense_wi_0_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(8116073536)))];
            tensor<fp16, [1, 10240, 1, 77]> x_43_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_3056, groups = var_2947, pad = x_43_pad_0, pad_type = x_43_pad_type_0, strides = var_3054, weight = block_20_layer_1_DenseReluDense_wi_0_weight_to_fp16, x = input_123_cast_fp16)[name = tensor<string, []>("x_43_cast_fp16")];
            tensor<string, []> var_3070_mode_0 = const()[name = tensor<string, []>("op_3070_mode_0"), val = tensor<string, []>("TANH_APPROXIMATION")];
            tensor<fp16, [1, 10240, 1, 77]> var_3070_cast_fp16 = gelu(mode = var_3070_mode_0, x = x_43_cast_fp16)[name = tensor<string, []>("op_3070_cast_fp16")];
            tensor<int32, [2]> var_3073 = const()[name = tensor<string, []>("op_3073"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_3075 = const()[name = tensor<string, []>("op_3075"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_3077_pad_type_0 = const()[name = tensor<string, []>("op_3077_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_3077_pad_0 = const()[name = tensor<string, []>("op_3077_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_20_layer_1_DenseReluDense_wi_1_weight_to_fp16 = const()[name = tensor<string, []>("block_20_layer_1_DenseReluDense_wi_1_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(8199959680)))];
            tensor<fp16, [1, 10240, 1, 77]> var_3077_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_3075, groups = var_2947, pad = var_3077_pad_0, pad_type = var_3077_pad_type_0, strides = var_3073, weight = block_20_layer_1_DenseReluDense_wi_1_weight_to_fp16, x = input_123_cast_fp16)[name = tensor<string, []>("op_3077_cast_fp16")];
            tensor<fp16, [1, 10240, 1, 77]> input_125_cast_fp16 = mul(x = var_3070_cast_fp16, y = var_3077_cast_fp16)[name = tensor<string, []>("input_125_cast_fp16")];
            tensor<int32, [2]> var_3081 = const()[name = tensor<string, []>("op_3081"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_3083 = const()[name = tensor<string, []>("op_3083"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_3085_pad_type_0 = const()[name = tensor<string, []>("op_3085_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_3085_pad_0 = const()[name = tensor<string, []>("op_3085_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 10240, 1, 1]> block_20_layer_1_DenseReluDense_wo_weight_to_fp16 = const()[name = tensor<string, []>("block_20_layer_1_DenseReluDense_wo_weight_to_fp16"), val = tensor<fp16, [4096, 10240, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(8283845824)))];
            tensor<fp16, [1, 4096, 1, 77]> var_3085_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_3083, groups = var_2947, pad = var_3085_pad_0, pad_type = var_3085_pad_type_0, strides = var_3081, weight = block_20_layer_1_DenseReluDense_wo_weight_to_fp16, x = input_125_cast_fp16)[name = tensor<string, []>("op_3085_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_169_cast_fp16 = add(x = inputs_167_cast_fp16, y = var_3085_cast_fp16)[name = tensor<string, []>("inputs_169_cast_fp16")];
            tensor<bool, []> var_3090 = const()[name = tensor<string, []>("op_3090"), val = tensor<bool, []>(true)];
            tensor<int32, []> var_3091 = const()[name = tensor<string, []>("op_3091"), val = tensor<int32, []>(1)];
            tensor<int32, []> var_3095 = const()[name = tensor<string, []>("op_3095"), val = tensor<int32, []>(3)];
            tensor<fp16, []> var_3093_to_fp16 = const()[name = tensor<string, []>("op_3093_to_fp16"), val = tensor<fp16, []>(-0x1.b18p+15)];
            tensor<fp16, []> var_3092_to_fp16 = const()[name = tensor<string, []>("op_3092_to_fp16"), val = tensor<fp16, []>(0x1.b18p+15)];
            tensor<fp16, [1, 4096, 1, 77]> inputs_171_cast_fp16 = clip(alpha = var_3093_to_fp16, beta = var_3092_to_fp16, x = inputs_169_cast_fp16)[name = tensor<string, []>("inputs_171_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_85_cast_fp16 = mul(x = inputs_171_cast_fp16, y = inputs_171_cast_fp16)[name = tensor<string, []>("inputs_sq_85_cast_fp16")];
            tensor<int32, [1]> var_3112 = const()[name = tensor<string, []>("op_3112"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_85_cast_fp16 = reduce_mean(axes = var_3112, keep_dims = var_3090, x = inputs_sq_85_cast_fp16)[name = tensor<string, []>("variance_85_cast_fp16")];
            tensor<fp16, []> var_3114_to_fp16 = const()[name = tensor<string, []>("op_3114_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_3115_cast_fp16 = add(x = variance_85_cast_fp16, y = var_3114_to_fp16)[name = tensor<string, []>("op_3115_cast_fp16")];
            tensor<fp16, []> var_3116_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_3116_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_3116_cast_fp16 = rsqrt(epsilon = var_3116_epsilon_0_to_fp16, x = var_3115_cast_fp16)[name = tensor<string, []>("op_3116_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_85_cast_fp16 = mul(x = inputs_171_cast_fp16, y = var_3116_cast_fp16)[name = tensor<string, []>("hidden_states_85_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_85_to_fp16 = const()[name = tensor<string, []>("w_85_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(8367731968)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_87_cast_fp16 = mul(x = w_85_to_fp16, y = hidden_states_85_cast_fp16)[name = tensor<string, []>("obj_87_cast_fp16")];
            tensor<int32, [2]> var_3130 = const()[name = tensor<string, []>("op_3130"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_3132 = const()[name = tensor<string, []>("op_3132"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> query_43_pad_type_0 = const()[name = tensor<string, []>("query_43_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> query_43_pad_0 = const()[name = tensor<string, []>("query_43_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_21_layer_0_SelfAttention_q_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_21_layer_0_SelfAttention_q_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(8367740224)))];
            tensor<fp16, [1, 4096, 1, 77]> query_43_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_3132, groups = var_3091, pad = query_43_pad_0, pad_type = query_43_pad_type_0, strides = var_3130, weight = block_21_layer_0_SelfAttention_q_proj_weight_to_fp16, x = obj_87_cast_fp16)[name = tensor<string, []>("query_43_cast_fp16")];
            tensor<int32, [2]> var_3136 = const()[name = tensor<string, []>("op_3136"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_3138 = const()[name = tensor<string, []>("op_3138"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> key_43_pad_type_0 = const()[name = tensor<string, []>("key_43_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> key_43_pad_0 = const()[name = tensor<string, []>("key_43_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_21_layer_0_SelfAttention_k_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_21_layer_0_SelfAttention_k_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(8401294720)))];
            tensor<fp16, [1, 4096, 1, 77]> key_43_cast_fp16 = conv(dilations = var_3138, groups = var_3091, pad = key_43_pad_0, pad_type = key_43_pad_type_0, strides = var_3136, weight = block_21_layer_0_SelfAttention_k_proj_weight_to_fp16, x = obj_87_cast_fp16)[name = tensor<string, []>("key_43_cast_fp16")];
            tensor<int32, [2]> var_3143 = const()[name = tensor<string, []>("op_3143"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_3145 = const()[name = tensor<string, []>("op_3145"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> value_43_pad_type_0 = const()[name = tensor<string, []>("value_43_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> value_43_pad_0 = const()[name = tensor<string, []>("value_43_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_21_layer_0_SelfAttention_v_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_21_layer_0_SelfAttention_v_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(8434849216)))];
            tensor<fp16, [1, 4096, 1, 77]> value_43_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_3145, groups = var_3091, pad = value_43_pad_0, pad_type = value_43_pad_type_0, strides = var_3143, weight = block_21_layer_0_SelfAttention_v_proj_weight_to_fp16, x = obj_87_cast_fp16)[name = tensor<string, []>("value_43_cast_fp16")];
            tensor<int32, [4]> var_3149 = const()[name = tensor<string, []>("op_3149"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_3150_cast_fp16 = reshape(shape = var_3149, x = query_43_cast_fp16)[name = tensor<string, []>("op_3150_cast_fp16")];
            tensor<int32, [4]> var_3151 = const()[name = tensor<string, []>("op_3151"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_3152_cast_fp16 = reshape(shape = var_3151, x = key_43_cast_fp16)[name = tensor<string, []>("op_3152_cast_fp16")];
            tensor<bool, []> mh_w_127_transpose_x_0 = const()[name = tensor<string, []>("mh_w_127_transpose_x_0"), val = tensor<bool, []>(true)];
            tensor<bool, []> mh_w_127_transpose_y_0 = const()[name = tensor<string, []>("mh_w_127_transpose_y_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 77, 77]> mh_w_127_cast_fp16 = matmul(transpose_x = mh_w_127_transpose_x_0, transpose_y = mh_w_127_transpose_y_0, x = var_3150_cast_fp16, y = var_3152_cast_fp16)[name = tensor<string, []>("mh_w_127_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> mh_w_129_cast_fp16 = add(x = mh_w_127_cast_fp16, y = var_133_cast_fp16)[name = tensor<string, []>("mh_w_129_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> mh_w_131_cast_fp16 = add(x = mh_w_129_cast_fp16, y = relative_attention_bias_to_fp16)[name = tensor<string, []>("mh_w_131_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> var_3161_cast_fp16 = softmax(axis = var_3095, x = mh_w_131_cast_fp16)[name = tensor<string, []>("op_3161_cast_fp16")];
            tensor<int32, [4]> var_3162 = const()[name = tensor<string, []>("op_3162"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_3163_cast_fp16 = reshape(shape = var_3162, x = value_43_cast_fp16)[name = tensor<string, []>("op_3163_cast_fp16")];
            tensor<bool, []> attn_43_transpose_x_0 = const()[name = tensor<string, []>("attn_43_transpose_x_0"), val = tensor<bool, []>(false)];
            tensor<bool, []> attn_43_transpose_y_0 = const()[name = tensor<string, []>("attn_43_transpose_y_0"), val = tensor<bool, []>(true)];
            tensor<fp16, [1, 64, 64, 77]> attn_43_cast_fp16 = matmul(transpose_x = attn_43_transpose_x_0, transpose_y = attn_43_transpose_y_0, x = var_3163_cast_fp16, y = var_3161_cast_fp16)[name = tensor<string, []>("attn_43_cast_fp16")];
            tensor<int32, [4]> var_3166 = const()[name = tensor<string, []>("op_3166"), val = tensor<int32, [4]>([1, 4096, 1, -1])];
            tensor<fp16, [1, 4096, 1, 77]> input_127_cast_fp16 = reshape(shape = var_3166, x = attn_43_cast_fp16)[name = tensor<string, []>("input_127_cast_fp16")];
            tensor<int32, [2]> var_3170 = const()[name = tensor<string, []>("op_3170"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_3172 = const()[name = tensor<string, []>("op_3172"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> obj_89_pad_type_0 = const()[name = tensor<string, []>("obj_89_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> obj_89_pad_0 = const()[name = tensor<string, []>("obj_89_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_21_layer_0_SelfAttention_o_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_21_layer_0_SelfAttention_o_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(8468403712)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_89_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_3172, groups = var_3091, pad = obj_89_pad_0, pad_type = obj_89_pad_type_0, strides = var_3170, weight = block_21_layer_0_SelfAttention_o_proj_weight_to_fp16, x = input_127_cast_fp16)[name = tensor<string, []>("obj_89_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_173_cast_fp16 = add(x = inputs_171_cast_fp16, y = obj_89_cast_fp16)[name = tensor<string, []>("inputs_173_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_175_cast_fp16 = clip(alpha = var_3093_to_fp16, beta = var_3092_to_fp16, x = inputs_173_cast_fp16)[name = tensor<string, []>("inputs_175_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_87_cast_fp16 = mul(x = inputs_175_cast_fp16, y = inputs_175_cast_fp16)[name = tensor<string, []>("inputs_sq_87_cast_fp16")];
            tensor<int32, [1]> var_3181 = const()[name = tensor<string, []>("op_3181"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_87_cast_fp16 = reduce_mean(axes = var_3181, keep_dims = var_3090, x = inputs_sq_87_cast_fp16)[name = tensor<string, []>("variance_87_cast_fp16")];
            tensor<fp16, []> var_3183_to_fp16 = const()[name = tensor<string, []>("op_3183_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_3184_cast_fp16 = add(x = variance_87_cast_fp16, y = var_3183_to_fp16)[name = tensor<string, []>("op_3184_cast_fp16")];
            tensor<fp16, []> var_3185_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_3185_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_3185_cast_fp16 = rsqrt(epsilon = var_3185_epsilon_0_to_fp16, x = var_3184_cast_fp16)[name = tensor<string, []>("op_3185_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_87_cast_fp16 = mul(x = inputs_175_cast_fp16, y = var_3185_cast_fp16)[name = tensor<string, []>("hidden_states_87_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_87_to_fp16 = const()[name = tensor<string, []>("w_87_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(8501958208)))];
            tensor<fp16, [1, 4096, 1, 77]> input_129_cast_fp16 = mul(x = w_87_to_fp16, y = hidden_states_87_cast_fp16)[name = tensor<string, []>("input_129_cast_fp16")];
            tensor<int32, [2]> var_3198 = const()[name = tensor<string, []>("op_3198"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_3200 = const()[name = tensor<string, []>("op_3200"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> x_45_pad_type_0 = const()[name = tensor<string, []>("x_45_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> x_45_pad_0 = const()[name = tensor<string, []>("x_45_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_21_layer_1_DenseReluDense_wi_0_weight_to_fp16 = const()[name = tensor<string, []>("block_21_layer_1_DenseReluDense_wi_0_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(8501966464)))];
            tensor<fp16, [1, 10240, 1, 77]> x_45_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_3200, groups = var_3091, pad = x_45_pad_0, pad_type = x_45_pad_type_0, strides = var_3198, weight = block_21_layer_1_DenseReluDense_wi_0_weight_to_fp16, x = input_129_cast_fp16)[name = tensor<string, []>("x_45_cast_fp16")];
            tensor<string, []> var_3214_mode_0 = const()[name = tensor<string, []>("op_3214_mode_0"), val = tensor<string, []>("TANH_APPROXIMATION")];
            tensor<fp16, [1, 10240, 1, 77]> var_3214_cast_fp16 = gelu(mode = var_3214_mode_0, x = x_45_cast_fp16)[name = tensor<string, []>("op_3214_cast_fp16")];
            tensor<int32, [2]> var_3217 = const()[name = tensor<string, []>("op_3217"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_3219 = const()[name = tensor<string, []>("op_3219"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_3221_pad_type_0 = const()[name = tensor<string, []>("op_3221_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_3221_pad_0 = const()[name = tensor<string, []>("op_3221_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_21_layer_1_DenseReluDense_wi_1_weight_to_fp16 = const()[name = tensor<string, []>("block_21_layer_1_DenseReluDense_wi_1_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(8585852608)))];
            tensor<fp16, [1, 10240, 1, 77]> var_3221_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_3219, groups = var_3091, pad = var_3221_pad_0, pad_type = var_3221_pad_type_0, strides = var_3217, weight = block_21_layer_1_DenseReluDense_wi_1_weight_to_fp16, x = input_129_cast_fp16)[name = tensor<string, []>("op_3221_cast_fp16")];
            tensor<fp16, [1, 10240, 1, 77]> input_131_cast_fp16 = mul(x = var_3214_cast_fp16, y = var_3221_cast_fp16)[name = tensor<string, []>("input_131_cast_fp16")];
            tensor<int32, [2]> var_3225 = const()[name = tensor<string, []>("op_3225"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_3227 = const()[name = tensor<string, []>("op_3227"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_3229_pad_type_0 = const()[name = tensor<string, []>("op_3229_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_3229_pad_0 = const()[name = tensor<string, []>("op_3229_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 10240, 1, 1]> block_21_layer_1_DenseReluDense_wo_weight_to_fp16 = const()[name = tensor<string, []>("block_21_layer_1_DenseReluDense_wo_weight_to_fp16"), val = tensor<fp16, [4096, 10240, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(8669738752)))];
            tensor<fp16, [1, 4096, 1, 77]> var_3229_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_3227, groups = var_3091, pad = var_3229_pad_0, pad_type = var_3229_pad_type_0, strides = var_3225, weight = block_21_layer_1_DenseReluDense_wo_weight_to_fp16, x = input_131_cast_fp16)[name = tensor<string, []>("op_3229_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_177_cast_fp16 = add(x = inputs_175_cast_fp16, y = var_3229_cast_fp16)[name = tensor<string, []>("inputs_177_cast_fp16")];
            tensor<bool, []> var_3234 = const()[name = tensor<string, []>("op_3234"), val = tensor<bool, []>(true)];
            tensor<int32, []> var_3235 = const()[name = tensor<string, []>("op_3235"), val = tensor<int32, []>(1)];
            tensor<int32, []> var_3239 = const()[name = tensor<string, []>("op_3239"), val = tensor<int32, []>(3)];
            tensor<fp16, []> var_3237_to_fp16 = const()[name = tensor<string, []>("op_3237_to_fp16"), val = tensor<fp16, []>(-0x1.b18p+15)];
            tensor<fp16, []> var_3236_to_fp16 = const()[name = tensor<string, []>("op_3236_to_fp16"), val = tensor<fp16, []>(0x1.b18p+15)];
            tensor<fp16, [1, 4096, 1, 77]> inputs_179_cast_fp16 = clip(alpha = var_3237_to_fp16, beta = var_3236_to_fp16, x = inputs_177_cast_fp16)[name = tensor<string, []>("inputs_179_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_89_cast_fp16 = mul(x = inputs_179_cast_fp16, y = inputs_179_cast_fp16)[name = tensor<string, []>("inputs_sq_89_cast_fp16")];
            tensor<int32, [1]> var_3256 = const()[name = tensor<string, []>("op_3256"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_89_cast_fp16 = reduce_mean(axes = var_3256, keep_dims = var_3234, x = inputs_sq_89_cast_fp16)[name = tensor<string, []>("variance_89_cast_fp16")];
            tensor<fp16, []> var_3258_to_fp16 = const()[name = tensor<string, []>("op_3258_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_3259_cast_fp16 = add(x = variance_89_cast_fp16, y = var_3258_to_fp16)[name = tensor<string, []>("op_3259_cast_fp16")];
            tensor<fp16, []> var_3260_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_3260_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_3260_cast_fp16 = rsqrt(epsilon = var_3260_epsilon_0_to_fp16, x = var_3259_cast_fp16)[name = tensor<string, []>("op_3260_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_89_cast_fp16 = mul(x = inputs_179_cast_fp16, y = var_3260_cast_fp16)[name = tensor<string, []>("hidden_states_89_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_89_to_fp16 = const()[name = tensor<string, []>("w_89_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(8753624896)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_91_cast_fp16 = mul(x = w_89_to_fp16, y = hidden_states_89_cast_fp16)[name = tensor<string, []>("obj_91_cast_fp16")];
            tensor<int32, [2]> var_3274 = const()[name = tensor<string, []>("op_3274"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_3276 = const()[name = tensor<string, []>("op_3276"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> query_45_pad_type_0 = const()[name = tensor<string, []>("query_45_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> query_45_pad_0 = const()[name = tensor<string, []>("query_45_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_22_layer_0_SelfAttention_q_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_22_layer_0_SelfAttention_q_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(8753633152)))];
            tensor<fp16, [1, 4096, 1, 77]> query_45_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_3276, groups = var_3235, pad = query_45_pad_0, pad_type = query_45_pad_type_0, strides = var_3274, weight = block_22_layer_0_SelfAttention_q_proj_weight_to_fp16, x = obj_91_cast_fp16)[name = tensor<string, []>("query_45_cast_fp16")];
            tensor<int32, [2]> var_3280 = const()[name = tensor<string, []>("op_3280"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_3282 = const()[name = tensor<string, []>("op_3282"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> key_45_pad_type_0 = const()[name = tensor<string, []>("key_45_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> key_45_pad_0 = const()[name = tensor<string, []>("key_45_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_22_layer_0_SelfAttention_k_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_22_layer_0_SelfAttention_k_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(8787187648)))];
            tensor<fp16, [1, 4096, 1, 77]> key_45_cast_fp16 = conv(dilations = var_3282, groups = var_3235, pad = key_45_pad_0, pad_type = key_45_pad_type_0, strides = var_3280, weight = block_22_layer_0_SelfAttention_k_proj_weight_to_fp16, x = obj_91_cast_fp16)[name = tensor<string, []>("key_45_cast_fp16")];
            tensor<int32, [2]> var_3287 = const()[name = tensor<string, []>("op_3287"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_3289 = const()[name = tensor<string, []>("op_3289"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> value_45_pad_type_0 = const()[name = tensor<string, []>("value_45_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> value_45_pad_0 = const()[name = tensor<string, []>("value_45_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_22_layer_0_SelfAttention_v_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_22_layer_0_SelfAttention_v_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(8820742144)))];
            tensor<fp16, [1, 4096, 1, 77]> value_45_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_3289, groups = var_3235, pad = value_45_pad_0, pad_type = value_45_pad_type_0, strides = var_3287, weight = block_22_layer_0_SelfAttention_v_proj_weight_to_fp16, x = obj_91_cast_fp16)[name = tensor<string, []>("value_45_cast_fp16")];
            tensor<int32, [4]> var_3293 = const()[name = tensor<string, []>("op_3293"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_3294_cast_fp16 = reshape(shape = var_3293, x = query_45_cast_fp16)[name = tensor<string, []>("op_3294_cast_fp16")];
            tensor<int32, [4]> var_3295 = const()[name = tensor<string, []>("op_3295"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_3296_cast_fp16 = reshape(shape = var_3295, x = key_45_cast_fp16)[name = tensor<string, []>("op_3296_cast_fp16")];
            tensor<bool, []> mh_w_133_transpose_x_0 = const()[name = tensor<string, []>("mh_w_133_transpose_x_0"), val = tensor<bool, []>(true)];
            tensor<bool, []> mh_w_133_transpose_y_0 = const()[name = tensor<string, []>("mh_w_133_transpose_y_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 77, 77]> mh_w_133_cast_fp16 = matmul(transpose_x = mh_w_133_transpose_x_0, transpose_y = mh_w_133_transpose_y_0, x = var_3294_cast_fp16, y = var_3296_cast_fp16)[name = tensor<string, []>("mh_w_133_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> mh_w_135_cast_fp16 = add(x = mh_w_133_cast_fp16, y = var_133_cast_fp16)[name = tensor<string, []>("mh_w_135_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> mh_w_137_cast_fp16 = add(x = mh_w_135_cast_fp16, y = relative_attention_bias_to_fp16)[name = tensor<string, []>("mh_w_137_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> var_3305_cast_fp16 = softmax(axis = var_3239, x = mh_w_137_cast_fp16)[name = tensor<string, []>("op_3305_cast_fp16")];
            tensor<int32, [4]> var_3306 = const()[name = tensor<string, []>("op_3306"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_3307_cast_fp16 = reshape(shape = var_3306, x = value_45_cast_fp16)[name = tensor<string, []>("op_3307_cast_fp16")];
            tensor<bool, []> attn_45_transpose_x_0 = const()[name = tensor<string, []>("attn_45_transpose_x_0"), val = tensor<bool, []>(false)];
            tensor<bool, []> attn_45_transpose_y_0 = const()[name = tensor<string, []>("attn_45_transpose_y_0"), val = tensor<bool, []>(true)];
            tensor<fp16, [1, 64, 64, 77]> attn_45_cast_fp16 = matmul(transpose_x = attn_45_transpose_x_0, transpose_y = attn_45_transpose_y_0, x = var_3307_cast_fp16, y = var_3305_cast_fp16)[name = tensor<string, []>("attn_45_cast_fp16")];
            tensor<int32, [4]> var_3310 = const()[name = tensor<string, []>("op_3310"), val = tensor<int32, [4]>([1, 4096, 1, -1])];
            tensor<fp16, [1, 4096, 1, 77]> input_133_cast_fp16 = reshape(shape = var_3310, x = attn_45_cast_fp16)[name = tensor<string, []>("input_133_cast_fp16")];
            tensor<int32, [2]> var_3314 = const()[name = tensor<string, []>("op_3314"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_3316 = const()[name = tensor<string, []>("op_3316"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> obj_93_pad_type_0 = const()[name = tensor<string, []>("obj_93_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> obj_93_pad_0 = const()[name = tensor<string, []>("obj_93_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_22_layer_0_SelfAttention_o_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_22_layer_0_SelfAttention_o_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(8854296640)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_93_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_3316, groups = var_3235, pad = obj_93_pad_0, pad_type = obj_93_pad_type_0, strides = var_3314, weight = block_22_layer_0_SelfAttention_o_proj_weight_to_fp16, x = input_133_cast_fp16)[name = tensor<string, []>("obj_93_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_181_cast_fp16 = add(x = inputs_179_cast_fp16, y = obj_93_cast_fp16)[name = tensor<string, []>("inputs_181_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_183_cast_fp16 = clip(alpha = var_3237_to_fp16, beta = var_3236_to_fp16, x = inputs_181_cast_fp16)[name = tensor<string, []>("inputs_183_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_91_cast_fp16 = mul(x = inputs_183_cast_fp16, y = inputs_183_cast_fp16)[name = tensor<string, []>("inputs_sq_91_cast_fp16")];
            tensor<int32, [1]> var_3325 = const()[name = tensor<string, []>("op_3325"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_91_cast_fp16 = reduce_mean(axes = var_3325, keep_dims = var_3234, x = inputs_sq_91_cast_fp16)[name = tensor<string, []>("variance_91_cast_fp16")];
            tensor<fp16, []> var_3327_to_fp16 = const()[name = tensor<string, []>("op_3327_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_3328_cast_fp16 = add(x = variance_91_cast_fp16, y = var_3327_to_fp16)[name = tensor<string, []>("op_3328_cast_fp16")];
            tensor<fp16, []> var_3329_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_3329_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_3329_cast_fp16 = rsqrt(epsilon = var_3329_epsilon_0_to_fp16, x = var_3328_cast_fp16)[name = tensor<string, []>("op_3329_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_91_cast_fp16 = mul(x = inputs_183_cast_fp16, y = var_3329_cast_fp16)[name = tensor<string, []>("hidden_states_91_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_91_to_fp16 = const()[name = tensor<string, []>("w_91_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(8887851136)))];
            tensor<fp16, [1, 4096, 1, 77]> input_135_cast_fp16 = mul(x = w_91_to_fp16, y = hidden_states_91_cast_fp16)[name = tensor<string, []>("input_135_cast_fp16")];
            tensor<int32, [2]> var_3342 = const()[name = tensor<string, []>("op_3342"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_3344 = const()[name = tensor<string, []>("op_3344"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> x_47_pad_type_0 = const()[name = tensor<string, []>("x_47_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> x_47_pad_0 = const()[name = tensor<string, []>("x_47_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_22_layer_1_DenseReluDense_wi_0_weight_to_fp16 = const()[name = tensor<string, []>("block_22_layer_1_DenseReluDense_wi_0_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(8887859392)))];
            tensor<fp16, [1, 10240, 1, 77]> x_47_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_3344, groups = var_3235, pad = x_47_pad_0, pad_type = x_47_pad_type_0, strides = var_3342, weight = block_22_layer_1_DenseReluDense_wi_0_weight_to_fp16, x = input_135_cast_fp16)[name = tensor<string, []>("x_47_cast_fp16")];
            tensor<string, []> var_3358_mode_0 = const()[name = tensor<string, []>("op_3358_mode_0"), val = tensor<string, []>("TANH_APPROXIMATION")];
            tensor<fp16, [1, 10240, 1, 77]> var_3358_cast_fp16 = gelu(mode = var_3358_mode_0, x = x_47_cast_fp16)[name = tensor<string, []>("op_3358_cast_fp16")];
            tensor<int32, [2]> var_3361 = const()[name = tensor<string, []>("op_3361"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_3363 = const()[name = tensor<string, []>("op_3363"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_3365_pad_type_0 = const()[name = tensor<string, []>("op_3365_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_3365_pad_0 = const()[name = tensor<string, []>("op_3365_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_22_layer_1_DenseReluDense_wi_1_weight_to_fp16 = const()[name = tensor<string, []>("block_22_layer_1_DenseReluDense_wi_1_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(8971745536)))];
            tensor<fp16, [1, 10240, 1, 77]> var_3365_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_3363, groups = var_3235, pad = var_3365_pad_0, pad_type = var_3365_pad_type_0, strides = var_3361, weight = block_22_layer_1_DenseReluDense_wi_1_weight_to_fp16, x = input_135_cast_fp16)[name = tensor<string, []>("op_3365_cast_fp16")];
            tensor<fp16, [1, 10240, 1, 77]> input_137_cast_fp16 = mul(x = var_3358_cast_fp16, y = var_3365_cast_fp16)[name = tensor<string, []>("input_137_cast_fp16")];
            tensor<int32, [2]> var_3369 = const()[name = tensor<string, []>("op_3369"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_3371 = const()[name = tensor<string, []>("op_3371"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_3373_pad_type_0 = const()[name = tensor<string, []>("op_3373_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_3373_pad_0 = const()[name = tensor<string, []>("op_3373_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 10240, 1, 1]> block_22_layer_1_DenseReluDense_wo_weight_to_fp16 = const()[name = tensor<string, []>("block_22_layer_1_DenseReluDense_wo_weight_to_fp16"), val = tensor<fp16, [4096, 10240, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(9055631680)))];
            tensor<fp16, [1, 4096, 1, 77]> var_3373_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_3371, groups = var_3235, pad = var_3373_pad_0, pad_type = var_3373_pad_type_0, strides = var_3369, weight = block_22_layer_1_DenseReluDense_wo_weight_to_fp16, x = input_137_cast_fp16)[name = tensor<string, []>("op_3373_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_185_cast_fp16 = add(x = inputs_183_cast_fp16, y = var_3373_cast_fp16)[name = tensor<string, []>("inputs_185_cast_fp16")];
            tensor<bool, []> var_3378 = const()[name = tensor<string, []>("op_3378"), val = tensor<bool, []>(true)];
            tensor<int32, []> var_3379 = const()[name = tensor<string, []>("op_3379"), val = tensor<int32, []>(1)];
            tensor<int32, []> var_3383 = const()[name = tensor<string, []>("op_3383"), val = tensor<int32, []>(3)];
            tensor<fp16, []> var_3381_to_fp16 = const()[name = tensor<string, []>("op_3381_to_fp16"), val = tensor<fp16, []>(-0x1.b18p+15)];
            tensor<fp16, []> var_3380_to_fp16 = const()[name = tensor<string, []>("op_3380_to_fp16"), val = tensor<fp16, []>(0x1.b18p+15)];
            tensor<fp16, [1, 4096, 1, 77]> inputs_187_cast_fp16 = clip(alpha = var_3381_to_fp16, beta = var_3380_to_fp16, x = inputs_185_cast_fp16)[name = tensor<string, []>("inputs_187_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_93_cast_fp16 = mul(x = inputs_187_cast_fp16, y = inputs_187_cast_fp16)[name = tensor<string, []>("inputs_sq_93_cast_fp16")];
            tensor<int32, [1]> var_3400 = const()[name = tensor<string, []>("op_3400"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_93_cast_fp16 = reduce_mean(axes = var_3400, keep_dims = var_3378, x = inputs_sq_93_cast_fp16)[name = tensor<string, []>("variance_93_cast_fp16")];
            tensor<fp16, []> var_3402_to_fp16 = const()[name = tensor<string, []>("op_3402_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_3403_cast_fp16 = add(x = variance_93_cast_fp16, y = var_3402_to_fp16)[name = tensor<string, []>("op_3403_cast_fp16")];
            tensor<fp16, []> var_3404_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_3404_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_3404_cast_fp16 = rsqrt(epsilon = var_3404_epsilon_0_to_fp16, x = var_3403_cast_fp16)[name = tensor<string, []>("op_3404_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_93_cast_fp16 = mul(x = inputs_187_cast_fp16, y = var_3404_cast_fp16)[name = tensor<string, []>("hidden_states_93_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_93_to_fp16 = const()[name = tensor<string, []>("w_93_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(9139517824)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_95_cast_fp16 = mul(x = w_93_to_fp16, y = hidden_states_93_cast_fp16)[name = tensor<string, []>("obj_95_cast_fp16")];
            tensor<int32, [2]> var_3418 = const()[name = tensor<string, []>("op_3418"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_3420 = const()[name = tensor<string, []>("op_3420"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> query_pad_type_0 = const()[name = tensor<string, []>("query_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> query_pad_0 = const()[name = tensor<string, []>("query_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_23_layer_0_SelfAttention_q_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_23_layer_0_SelfAttention_q_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(9139526080)))];
            tensor<fp16, [1, 4096, 1, 77]> query_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_3420, groups = var_3379, pad = query_pad_0, pad_type = query_pad_type_0, strides = var_3418, weight = block_23_layer_0_SelfAttention_q_proj_weight_to_fp16, x = obj_95_cast_fp16)[name = tensor<string, []>("query_cast_fp16")];
            tensor<int32, [2]> var_3424 = const()[name = tensor<string, []>("op_3424"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_3426 = const()[name = tensor<string, []>("op_3426"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> key_pad_type_0 = const()[name = tensor<string, []>("key_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> key_pad_0 = const()[name = tensor<string, []>("key_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_23_layer_0_SelfAttention_k_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_23_layer_0_SelfAttention_k_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(9173080576)))];
            tensor<fp16, [1, 4096, 1, 77]> key_cast_fp16 = conv(dilations = var_3426, groups = var_3379, pad = key_pad_0, pad_type = key_pad_type_0, strides = var_3424, weight = block_23_layer_0_SelfAttention_k_proj_weight_to_fp16, x = obj_95_cast_fp16)[name = tensor<string, []>("key_cast_fp16")];
            tensor<int32, [2]> var_3431 = const()[name = tensor<string, []>("op_3431"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_3433 = const()[name = tensor<string, []>("op_3433"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> value_pad_type_0 = const()[name = tensor<string, []>("value_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> value_pad_0 = const()[name = tensor<string, []>("value_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_23_layer_0_SelfAttention_v_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_23_layer_0_SelfAttention_v_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(9206635072)))];
            tensor<fp16, [1, 4096, 1, 77]> value_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_3433, groups = var_3379, pad = value_pad_0, pad_type = value_pad_type_0, strides = var_3431, weight = block_23_layer_0_SelfAttention_v_proj_weight_to_fp16, x = obj_95_cast_fp16)[name = tensor<string, []>("value_cast_fp16")];
            tensor<int32, [4]> var_3437 = const()[name = tensor<string, []>("op_3437"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_3438_cast_fp16 = reshape(shape = var_3437, x = query_cast_fp16)[name = tensor<string, []>("op_3438_cast_fp16")];
            tensor<int32, [4]> var_3439 = const()[name = tensor<string, []>("op_3439"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_3440_cast_fp16 = reshape(shape = var_3439, x = key_cast_fp16)[name = tensor<string, []>("op_3440_cast_fp16")];
            tensor<bool, []> mh_w_139_transpose_x_0 = const()[name = tensor<string, []>("mh_w_139_transpose_x_0"), val = tensor<bool, []>(true)];
            tensor<bool, []> mh_w_139_transpose_y_0 = const()[name = tensor<string, []>("mh_w_139_transpose_y_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 77, 77]> mh_w_139_cast_fp16 = matmul(transpose_x = mh_w_139_transpose_x_0, transpose_y = mh_w_139_transpose_y_0, x = var_3438_cast_fp16, y = var_3440_cast_fp16)[name = tensor<string, []>("mh_w_139_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> mh_w_141_cast_fp16 = add(x = mh_w_139_cast_fp16, y = var_133_cast_fp16)[name = tensor<string, []>("mh_w_141_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> mh_w_cast_fp16 = add(x = mh_w_141_cast_fp16, y = relative_attention_bias_to_fp16)[name = tensor<string, []>("mh_w_cast_fp16")];
            tensor<fp16, [1, 64, 77, 77]> var_3449_cast_fp16 = softmax(axis = var_3383, x = mh_w_cast_fp16)[name = tensor<string, []>("op_3449_cast_fp16")];
            tensor<int32, [4]> var_3450 = const()[name = tensor<string, []>("op_3450"), val = tensor<int32, [4]>([1, 64, 64, -1])];
            tensor<fp16, [1, 64, 64, 77]> var_3451_cast_fp16 = reshape(shape = var_3450, x = value_cast_fp16)[name = tensor<string, []>("op_3451_cast_fp16")];
            tensor<bool, []> attn_transpose_x_0 = const()[name = tensor<string, []>("attn_transpose_x_0"), val = tensor<bool, []>(false)];
            tensor<bool, []> attn_transpose_y_0 = const()[name = tensor<string, []>("attn_transpose_y_0"), val = tensor<bool, []>(true)];
            tensor<fp16, [1, 64, 64, 77]> attn_cast_fp16 = matmul(transpose_x = attn_transpose_x_0, transpose_y = attn_transpose_y_0, x = var_3451_cast_fp16, y = var_3449_cast_fp16)[name = tensor<string, []>("attn_cast_fp16")];
            tensor<int32, [4]> var_3454 = const()[name = tensor<string, []>("op_3454"), val = tensor<int32, [4]>([1, 4096, 1, -1])];
            tensor<fp16, [1, 4096, 1, 77]> input_139_cast_fp16 = reshape(shape = var_3454, x = attn_cast_fp16)[name = tensor<string, []>("input_139_cast_fp16")];
            tensor<int32, [2]> var_3458 = const()[name = tensor<string, []>("op_3458"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_3460 = const()[name = tensor<string, []>("op_3460"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> obj_pad_type_0 = const()[name = tensor<string, []>("obj_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> obj_pad_0 = const()[name = tensor<string, []>("obj_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 4096, 1, 1]> block_23_layer_0_SelfAttention_o_proj_weight_to_fp16 = const()[name = tensor<string, []>("block_23_layer_0_SelfAttention_o_proj_weight_to_fp16"), val = tensor<fp16, [4096, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(9240189568)))];
            tensor<fp16, [1, 4096, 1, 77]> obj_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_3460, groups = var_3379, pad = obj_pad_0, pad_type = obj_pad_type_0, strides = var_3458, weight = block_23_layer_0_SelfAttention_o_proj_weight_to_fp16, x = input_139_cast_fp16)[name = tensor<string, []>("obj_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_189_cast_fp16 = add(x = inputs_187_cast_fp16, y = obj_cast_fp16)[name = tensor<string, []>("inputs_189_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_191_cast_fp16 = clip(alpha = var_3381_to_fp16, beta = var_3380_to_fp16, x = inputs_189_cast_fp16)[name = tensor<string, []>("inputs_191_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_95_cast_fp16 = mul(x = inputs_191_cast_fp16, y = inputs_191_cast_fp16)[name = tensor<string, []>("inputs_sq_95_cast_fp16")];
            tensor<int32, [1]> var_3469 = const()[name = tensor<string, []>("op_3469"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_95_cast_fp16 = reduce_mean(axes = var_3469, keep_dims = var_3378, x = inputs_sq_95_cast_fp16)[name = tensor<string, []>("variance_95_cast_fp16")];
            tensor<fp16, []> var_3471_to_fp16 = const()[name = tensor<string, []>("op_3471_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_3472_cast_fp16 = add(x = variance_95_cast_fp16, y = var_3471_to_fp16)[name = tensor<string, []>("op_3472_cast_fp16")];
            tensor<fp16, []> var_3473_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_3473_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_3473_cast_fp16 = rsqrt(epsilon = var_3473_epsilon_0_to_fp16, x = var_3472_cast_fp16)[name = tensor<string, []>("op_3473_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_95_cast_fp16 = mul(x = inputs_191_cast_fp16, y = var_3473_cast_fp16)[name = tensor<string, []>("hidden_states_95_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_95_to_fp16 = const()[name = tensor<string, []>("w_95_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(9273744064)))];
            tensor<fp16, [1, 4096, 1, 77]> input_141_cast_fp16 = mul(x = w_95_to_fp16, y = hidden_states_95_cast_fp16)[name = tensor<string, []>("input_141_cast_fp16")];
            tensor<int32, [2]> var_3486 = const()[name = tensor<string, []>("op_3486"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_3488 = const()[name = tensor<string, []>("op_3488"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> x_pad_type_0 = const()[name = tensor<string, []>("x_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> x_pad_0 = const()[name = tensor<string, []>("x_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_23_layer_1_DenseReluDense_wi_0_weight_to_fp16 = const()[name = tensor<string, []>("block_23_layer_1_DenseReluDense_wi_0_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(9273752320)))];
            tensor<fp16, [1, 10240, 1, 77]> x_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_3488, groups = var_3379, pad = x_pad_0, pad_type = x_pad_type_0, strides = var_3486, weight = block_23_layer_1_DenseReluDense_wi_0_weight_to_fp16, x = input_141_cast_fp16)[name = tensor<string, []>("x_cast_fp16")];
            tensor<string, []> var_3502_mode_0 = const()[name = tensor<string, []>("op_3502_mode_0"), val = tensor<string, []>("TANH_APPROXIMATION")];
            tensor<fp16, [1, 10240, 1, 77]> var_3502_cast_fp16 = gelu(mode = var_3502_mode_0, x = x_cast_fp16)[name = tensor<string, []>("op_3502_cast_fp16")];
            tensor<int32, [2]> var_3505 = const()[name = tensor<string, []>("op_3505"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_3507 = const()[name = tensor<string, []>("op_3507"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_3509_pad_type_0 = const()[name = tensor<string, []>("op_3509_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_3509_pad_0 = const()[name = tensor<string, []>("op_3509_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [10240, 4096, 1, 1]> block_23_layer_1_DenseReluDense_wi_1_weight_to_fp16 = const()[name = tensor<string, []>("block_23_layer_1_DenseReluDense_wi_1_weight_to_fp16"), val = tensor<fp16, [10240, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(9357638464)))];
            tensor<fp16, [1, 10240, 1, 77]> var_3509_cast_fp16 = conv(bias = block_0_layer_1_DenseReluDense_wi_0_bias_to_fp16, dilations = var_3507, groups = var_3379, pad = var_3509_pad_0, pad_type = var_3509_pad_type_0, strides = var_3505, weight = block_23_layer_1_DenseReluDense_wi_1_weight_to_fp16, x = input_141_cast_fp16)[name = tensor<string, []>("op_3509_cast_fp16")];
            tensor<fp16, [1, 10240, 1, 77]> input_cast_fp16 = mul(x = var_3502_cast_fp16, y = var_3509_cast_fp16)[name = tensor<string, []>("input_cast_fp16")];
            tensor<int32, [2]> var_3513 = const()[name = tensor<string, []>("op_3513"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_3515 = const()[name = tensor<string, []>("op_3515"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> var_3517_pad_type_0 = const()[name = tensor<string, []>("op_3517_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_3517_pad_0 = const()[name = tensor<string, []>("op_3517_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [4096, 10240, 1, 1]> block_23_layer_1_DenseReluDense_wo_weight_to_fp16 = const()[name = tensor<string, []>("block_23_layer_1_DenseReluDense_wo_weight_to_fp16"), val = tensor<fp16, [4096, 10240, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(9441524608)))];
            tensor<fp16, [1, 4096, 1, 77]> var_3517_cast_fp16 = conv(bias = block_0_layer_0_SelfAttention_q_proj_bias_to_fp16, dilations = var_3515, groups = var_3379, pad = var_3517_pad_0, pad_type = var_3517_pad_type_0, strides = var_3513, weight = block_23_layer_1_DenseReluDense_wo_weight_to_fp16, x = input_cast_fp16)[name = tensor<string, []>("op_3517_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_193_cast_fp16 = add(x = inputs_191_cast_fp16, y = var_3517_cast_fp16)[name = tensor<string, []>("inputs_193_cast_fp16")];
            tensor<bool, []> var_3521 = const()[name = tensor<string, []>("op_3521"), val = tensor<bool, []>(true)];
            tensor<fp16, []> var_3524_to_fp16 = const()[name = tensor<string, []>("op_3524_to_fp16"), val = tensor<fp16, []>(-0x1.b18p+15)];
            tensor<fp16, []> var_3523_to_fp16 = const()[name = tensor<string, []>("op_3523_to_fp16"), val = tensor<fp16, []>(0x1.b18p+15)];
            tensor<fp16, [1, 4096, 1, 77]> inputs_cast_fp16 = clip(alpha = var_3524_to_fp16, beta = var_3523_to_fp16, x = inputs_193_cast_fp16)[name = tensor<string, []>("inputs_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> inputs_sq_cast_fp16 = mul(x = inputs_cast_fp16, y = inputs_cast_fp16)[name = tensor<string, []>("inputs_sq_cast_fp16")];
            tensor<int32, [1]> var_3528 = const()[name = tensor<string, []>("op_3528"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 77]> variance_cast_fp16 = reduce_mean(axes = var_3528, keep_dims = var_3521, x = inputs_sq_cast_fp16)[name = tensor<string, []>("variance_cast_fp16")];
            tensor<fp16, []> var_3530_to_fp16 = const()[name = tensor<string, []>("op_3530_to_fp16"), val = tensor<fp16, []>(0x1.1p-20)];
            tensor<fp16, [1, 1, 1, 77]> var_3531_cast_fp16 = add(x = variance_cast_fp16, y = var_3530_to_fp16)[name = tensor<string, []>("op_3531_cast_fp16")];
            tensor<fp16, []> var_3532_epsilon_0_to_fp16 = const()[name = tensor<string, []>("op_3532_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 77]> var_3532_cast_fp16 = rsqrt(epsilon = var_3532_epsilon_0_to_fp16, x = var_3531_cast_fp16)[name = tensor<string, []>("op_3532_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 77]> hidden_states_cast_fp16 = mul(x = inputs_cast_fp16, y = var_3532_cast_fp16)[name = tensor<string, []>("hidden_states_cast_fp16")];
            tensor<fp16, [1, 4096, 1, 1]> w_to_fp16 = const()[name = tensor<string, []>("w_to_fp16"), val = tensor<fp16, [1, 4096, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(9525410752)))];
            tensor<fp16, [1, 4096, 1, 77]> encoder_hidden_states = mul(x = w_to_fp16, y = hidden_states_cast_fp16)[name = tensor<string, []>("op_3536_cast_fp16")];
        } -> (encoder_hidden_states);
}