Skip to content

Instantly share code, notes, and snippets.

Show Gist options
  • Save AmosLewis/ecef37756ebf1cc6ee0eb3d99b9b231d to your computer and use it in GitHub Desktop.
Save AmosLewis/ecef37756ebf1cc6ee0eb3d99b9b231d to your computer and use it in GitHub Desktop.
module {
func.func @main_graph(%arg0: !torch.vtensor<[1,7],si64>) -> (!torch.vtensor<[1,7,50257],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>) attributes {torch.onnx_meta.ir_version = 8 : si64, torch.onnx_meta.opset_version = 17 : si64, torch.onnx_meta.producer_name = "pytorch", torch.onnx_meta.producer_version = "2.4.0"} {
%0 = torch.vtensor.literal(dense_resource<__elided__> : tensor<50257x1600xf32>) : !torch.vtensor<[50257,1600],f32>
%1 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1024x1600xf32>) : !torch.vtensor<[1024,1600],f32>
%2 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%3 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%4 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%5 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%6 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%7 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%8 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%9 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%10 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%11 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%12 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%13 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%14 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%15 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%16 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%17 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%18 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%19 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%20 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%21 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%22 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%23 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%24 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%25 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%26 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%27 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%28 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%29 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%30 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%31 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%32 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%33 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%34 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%35 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%36 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%37 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%38 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%39 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%40 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%41 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%42 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%43 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%44 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%45 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%46 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%47 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%48 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%49 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%50 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%51 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%52 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%53 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%54 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%55 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%56 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%57 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%58 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%59 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%60 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%61 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%62 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%63 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%64 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%65 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%66 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%67 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%68 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%69 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%70 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%71 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%72 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%73 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%74 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%75 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%76 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%77 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%78 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%79 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%80 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%81 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%82 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%83 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%84 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%85 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%86 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%87 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%88 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%89 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%90 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%91 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%92 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%93 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%94 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%95 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%96 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%97 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%98 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%99 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%100 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%101 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%102 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%103 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%104 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%105 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%106 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%107 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%108 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%109 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%110 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%111 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%112 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%113 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%114 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%115 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%116 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%117 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%118 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%119 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%120 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%121 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%122 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%123 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%124 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%125 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%126 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%127 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%128 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%129 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%130 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%131 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%132 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%133 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%134 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%135 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%136 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%137 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%138 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%139 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%140 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%141 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%142 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%143 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%144 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%145 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%146 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%147 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%148 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%149 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%150 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%151 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%152 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%153 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%154 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%155 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%156 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%157 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%158 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%159 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%160 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%161 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%162 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%163 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%164 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%165 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%166 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%167 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%168 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%169 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%170 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%171 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%172 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%173 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%174 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%175 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%176 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%177 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%178 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%179 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%180 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%181 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%182 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%183 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%184 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%185 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%186 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%187 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%188 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%189 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%190 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%191 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%192 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%193 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%194 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%195 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%196 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%197 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%198 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%199 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%200 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%201 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%202 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%203 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%204 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%205 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%206 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%207 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%208 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%209 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%210 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%211 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%212 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%213 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%214 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%215 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%216 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%217 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%218 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%219 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%220 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%221 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%222 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%223 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%224 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%225 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%226 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%227 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%228 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%229 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%230 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%231 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%232 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%233 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%234 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%235 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%236 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%237 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%238 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%239 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%240 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%241 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%242 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%243 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%244 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%245 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%246 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%247 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%248 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%249 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%250 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%251 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%252 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%253 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%254 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%255 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%256 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%257 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%258 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%259 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%260 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%261 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%262 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%263 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%264 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%265 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%266 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%267 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%268 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%269 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%270 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%271 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%272 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%273 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%274 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%275 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%276 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%277 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%278 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%279 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%280 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%281 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%282 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%283 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%284 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%285 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%286 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%287 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%288 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%289 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%290 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%291 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%292 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%293 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%294 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%295 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%296 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%297 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%298 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%299 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%300 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%301 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%302 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%303 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%304 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%305 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%306 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%307 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%308 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%309 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%310 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%311 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%312 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%313 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%314 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%315 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%316 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%317 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%318 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%319 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%320 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%321 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%322 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%323 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%324 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%325 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%326 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%327 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%328 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%329 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%330 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%331 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%332 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%333 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%334 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%335 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%336 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%337 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%338 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%339 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%340 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%341 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%342 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%343 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%344 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%345 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%346 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%347 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%348 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%349 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%350 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%351 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%352 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%353 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%354 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%355 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%356 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%357 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%358 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%359 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%360 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%361 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%362 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%363 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%364 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%365 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%366 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%367 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%368 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%369 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%370 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%371 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%372 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%373 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%374 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%375 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%376 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%377 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%378 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%379 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%380 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%381 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%382 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%383 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%384 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%385 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%386 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%387 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%388 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%389 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%390 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%391 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%392 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%393 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%394 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%395 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%396 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%397 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%398 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%399 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%400 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%401 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%402 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%403 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%404 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%405 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%406 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%407 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%408 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%409 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%410 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%411 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%412 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%413 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%414 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%415 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%416 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%417 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%418 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%419 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%420 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%421 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%422 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%423 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%424 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%425 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%426 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%427 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%428 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%429 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%430 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%431 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%432 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%433 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%434 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%435 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%436 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%437 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%438 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%439 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%440 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%441 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%442 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%443 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%444 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%445 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%446 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%447 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%448 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%449 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%450 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%451 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%452 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%453 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%454 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%455 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%456 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%457 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%458 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%459 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%460 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%461 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%462 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%463 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%464 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%465 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%466 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%467 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%468 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%469 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%470 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%471 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%472 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%473 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%474 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%475 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%476 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%477 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%478 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%479 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%480 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%481 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%482 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%483 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%484 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%485 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%486 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%487 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%488 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%489 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%490 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%491 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%492 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%493 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%494 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%495 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%496 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%497 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%498 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%499 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%500 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%501 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%502 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%503 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%504 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%505 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%506 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%507 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%508 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%509 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%510 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%511 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%512 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%513 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%514 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%515 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%516 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%517 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%518 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%519 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%520 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%521 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%522 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%523 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%524 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%525 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%526 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%527 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%528 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%529 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%530 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%531 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%532 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%533 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%534 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%535 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%536 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%537 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%538 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%539 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%540 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%541 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%542 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%543 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%544 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%545 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%546 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%547 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%548 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%549 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%550 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%551 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%552 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%553 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%554 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%555 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%556 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%557 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%558 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%559 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%560 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%561 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%562 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%563 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%564 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%565 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%566 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%567 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%568 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x4800xf32>) : !torch.vtensor<[1600,4800],f32>
%569 = torch.vtensor.literal(dense_resource<__elided__> : tensor<4800xf32>) : !torch.vtensor<[4800],f32>
%570 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x1600xf32>) : !torch.vtensor<[1600,1600],f32>
%571 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%572 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%573 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%574 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x6400xf32>) : !torch.vtensor<[1600,6400],f32>
%575 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400xf32>) : !torch.vtensor<[6400],f32>
%576 = torch.vtensor.literal(dense_resource<__elided__> : tensor<6400x1600xf32>) : !torch.vtensor<[6400,1600],f32>
%577 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%578 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%579 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600xf32>) : !torch.vtensor<[1600],f32>
%580 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1600x50257xf32>) : !torch.vtensor<[1600,50257],f32>
%none = torch.constant.none
%581 = torch.vtensor.literal(dense<[-1, 7]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int1 = torch.constant.int 1
%int7 = torch.constant.int 7
%582 = torch.prim.ListConstruct %int1, %int7 : (!torch.int, !torch.int) -> !torch.list<int>
%583 = torch.aten.reshape %arg0, %582 : !torch.vtensor<[1,7],si64>, !torch.list<int> -> !torch.vtensor<[1,7],si64>
%584 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x7xsi64>) : !torch.vtensor<[1,7],si64>
%int0 = torch.constant.int 0
%int0_0 = torch.constant.int 0
%int1_1 = torch.constant.int 1
%585 = torch.aten.lt.Scalar %583, %int0_0 : !torch.vtensor<[1,7],si64>, !torch.int -> !torch.vtensor<[1,7],i1>
%586 = torch.aten.size.int %0, %int0 : !torch.vtensor<[50257,1600],f32>, !torch.int -> !torch.int
%587 = torch.aten.add.Scalar %583, %586, %int1_1 : !torch.vtensor<[1,7],si64>, !torch.int, !torch.int -> !torch.vtensor<[1,7],si64>
%588 = torch.aten.where.self %585, %587, %583 : !torch.vtensor<[1,7],i1>, !torch.vtensor<[1,7],si64>, !torch.vtensor<[1,7],si64> -> !torch.vtensor<[1,7],si64>
%int0_2 = torch.constant.int 0
%589 = torch.aten.size.int %588, %int0_2 : !torch.vtensor<[1,7],si64>, !torch.int -> !torch.int
%int1_3 = torch.constant.int 1
%590 = torch.aten.size.int %588, %int1_3 : !torch.vtensor<[1,7],si64>, !torch.int -> !torch.int
%591 = torch.prim.ListConstruct %589, %590 : (!torch.int, !torch.int) -> !torch.list<int>
%592 = torch.aten.dim %588 : !torch.vtensor<[1,7],si64> -> !torch.int
%593 = torch.aten.sub.int %592, %int1_1 : !torch.int, !torch.int -> !torch.int
%594 = torch.aten.flatten.using_ints %588, %int0_0, %593 : !torch.vtensor<[1,7],si64>, !torch.int, !torch.int -> !torch.vtensor<[7],si64>
%595 = torch.aten.index_select %0, %int0, %594 : !torch.vtensor<[50257,1600],f32>, !torch.int, !torch.vtensor<[7],si64> -> !torch.vtensor<[7,1600],f32>
%596 = torch.aten.unflatten.int %595, %int0, %591 : !torch.vtensor<[7,1600],f32>, !torch.int, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int0_4 = torch.constant.int 0
%int0_5 = torch.constant.int 0
%int1_6 = torch.constant.int 1
%597 = torch.aten.lt.Scalar %584, %int0_5 : !torch.vtensor<[1,7],si64>, !torch.int -> !torch.vtensor<[1,7],i1>
%598 = torch.aten.size.int %1, %int0_4 : !torch.vtensor<[1024,1600],f32>, !torch.int -> !torch.int
%599 = torch.aten.add.Scalar %584, %598, %int1_6 : !torch.vtensor<[1,7],si64>, !torch.int, !torch.int -> !torch.vtensor<[1,7],si64>
%600 = torch.aten.where.self %597, %599, %584 : !torch.vtensor<[1,7],i1>, !torch.vtensor<[1,7],si64>, !torch.vtensor<[1,7],si64> -> !torch.vtensor<[1,7],si64>
%int0_7 = torch.constant.int 0
%601 = torch.aten.size.int %600, %int0_7 : !torch.vtensor<[1,7],si64>, !torch.int -> !torch.int
%int1_8 = torch.constant.int 1
%602 = torch.aten.size.int %600, %int1_8 : !torch.vtensor<[1,7],si64>, !torch.int -> !torch.int
%603 = torch.prim.ListConstruct %601, %602 : (!torch.int, !torch.int) -> !torch.list<int>
%604 = torch.aten.dim %600 : !torch.vtensor<[1,7],si64> -> !torch.int
%605 = torch.aten.sub.int %604, %int1_6 : !torch.int, !torch.int -> !torch.int
%606 = torch.aten.flatten.using_ints %600, %int0_5, %605 : !torch.vtensor<[1,7],si64>, !torch.int, !torch.int -> !torch.vtensor<[7],si64>
%607 = torch.aten.index_select %1, %int0_4, %606 : !torch.vtensor<[1024,1600],f32>, !torch.int, !torch.vtensor<[7],si64> -> !torch.vtensor<[7,1600],f32>
%608 = torch.aten.unflatten.int %607, %int0_4, %603 : !torch.vtensor<[7,1600],f32>, !torch.int, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_9 = torch.constant.int 1
%609 = torch.aten.add.Tensor %596, %608, %int1_9 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06 = torch.constant.float 9.9999997473787516E-6
%int1600 = torch.constant.int 1600
%610 = torch.prim.ListConstruct %int1600 : (!torch.int) -> !torch.list<int>
%result0, %result1, %result2 = torch.aten.native_layer_norm %609, %610, %2, %3, %float9.999990e-06 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%611 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_10 = torch.constant.int 7
%int1600_11 = torch.constant.int 1600
%612 = torch.prim.ListConstruct %int7_10, %int1600_11 : (!torch.int, !torch.int) -> !torch.list<int>
%613 = torch.aten.reshape %result0, %612 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_12 = torch.constant.int 0
%int1_13 = torch.constant.int 1
%614 = torch.aten.mm %613, %4 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%615 = torch.aten.add.Tensor %614, %5, %int1_13 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%616 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_14 = torch.constant.int 1
%int7_15 = torch.constant.int 7
%int4800 = torch.constant.int 4800
%617 = torch.prim.ListConstruct %int1_14, %int7_15, %int4800 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%618 = torch.aten.reshape %615, %617 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%619 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%620 = torch.prim.tolist(%619) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2 = torch.constant.int 2
%621 = torch.aten.split_with_sizes %618, %620, %int2 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%622:3 = torch.prim.ListUnpack %621 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%623 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_16 = torch.constant.int 1
%int7_17 = torch.constant.int 7
%int25 = torch.constant.int 25
%int64 = torch.constant.int 64
%624 = torch.prim.ListConstruct %int1_16, %int7_17, %int25, %int64 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%625 = torch.aten.reshape %622#0, %624 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_18 = torch.constant.int 1
%int2_19 = torch.constant.int 2
%626 = torch.aten.transpose.int %625, %int1_18, %int2_19 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%627 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_20 = torch.constant.int 1
%int7_21 = torch.constant.int 7
%int25_22 = torch.constant.int 25
%int64_23 = torch.constant.int 64
%628 = torch.prim.ListConstruct %int1_20, %int7_21, %int25_22, %int64_23 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%629 = torch.aten.reshape %622#1, %628 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_24 = torch.constant.int 1
%int2_25 = torch.constant.int 2
%630 = torch.aten.transpose.int %629, %int1_24, %int2_25 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%631 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_26 = torch.constant.int 1
%int7_27 = torch.constant.int 7
%int25_28 = torch.constant.int 25
%int64_29 = torch.constant.int 64
%632 = torch.prim.ListConstruct %int1_26, %int7_27, %int25_28, %int64_29 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%633 = torch.aten.reshape %622#2, %632 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_30 = torch.constant.int 1
%int2_31 = torch.constant.int 2
%634 = torch.aten.transpose.int %633, %int1_30, %int2_31 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_32 = torch.constant.int 1
%int2_33 = torch.constant.int 2
%635 = torch.aten.transpose.int %629, %int1_32, %int2_33 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_34 = torch.constant.int 2
%int3 = torch.constant.int 3
%636 = torch.aten.transpose.int %635, %int2_34, %int3 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%637 = torch.aten.matmul %626, %636 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%638 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%639 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%640 = torch.aten.pow.Tensor_Tensor %638, %639 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%641 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_35 = torch.constant.int 0
%642 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_36 = torch.constant.none
%float0.000000e00 = torch.constant.float 0.000000e+00
%643 = torch.aten.full %642, %float0.000000e00, %none_36, %none_36, %none_36, %none_36 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_37 = torch.constant.int 1
%644 = torch.aten.add.Tensor %643, %640, %int1_37 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%645 = torch.aten.div.Tensor %637, %644 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%646 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6 = torch.constant.int 6
%none_38 = torch.constant.none
%false = torch.constant.bool false
%647 = torch.aten.to.dtype %645, %int6, %false, %false, %none_38 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%648 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%649 = torch.aten.where.self %646, %647, %648 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_39 = torch.constant.int 3
%none_40 = torch.constant.none
%650 = torch.aten.softmax.int %649, %int3_39, %none_40 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_41 = torch.constant.int 6
%none_42 = torch.constant.none
%false_43 = torch.constant.bool false
%651 = torch.aten.to.dtype %650, %int6_41, %false_43, %false_43, %none_42 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%652 = torch.aten.matmul %651, %634 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_44 = torch.constant.int 1
%int2_45 = torch.constant.int 2
%653 = torch.aten.transpose.int %652, %int1_44, %int2_45 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%654 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_46 = torch.constant.int 1
%int7_47 = torch.constant.int 7
%int1600_48 = torch.constant.int 1600
%655 = torch.prim.ListConstruct %int1_46, %int7_47, %int1600_48 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%656 = torch.aten.reshape %653, %655 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%657 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_49 = torch.constant.int 7
%int1600_50 = torch.constant.int 1600
%658 = torch.prim.ListConstruct %int7_49, %int1600_50 : (!torch.int, !torch.int) -> !torch.list<int>
%659 = torch.aten.reshape %656, %658 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_51 = torch.constant.int 0
%int1_52 = torch.constant.int 1
%660 = torch.aten.mm %659, %6 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%661 = torch.aten.add.Tensor %660, %7, %int1_52 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%662 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_53 = torch.constant.int 1
%int7_54 = torch.constant.int 7
%int1600_55 = torch.constant.int 1600
%663 = torch.prim.ListConstruct %int1_53, %int7_54, %int1600_55 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%664 = torch.aten.reshape %661, %663 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_56 = torch.constant.int 1
%665 = torch.aten.add.Tensor %664, %609, %int1_56 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_57 = torch.constant.float 9.9999997473787516E-6
%int1600_58 = torch.constant.int 1600
%666 = torch.prim.ListConstruct %int1600_58 : (!torch.int) -> !torch.list<int>
%result0_59, %result1_60, %result2_61 = torch.aten.native_layer_norm %665, %666, %8, %9, %float9.999990e-06_57 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%667 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_62 = torch.constant.int 7
%int1600_63 = torch.constant.int 1600
%668 = torch.prim.ListConstruct %int7_62, %int1600_63 : (!torch.int, !torch.int) -> !torch.list<int>
%669 = torch.aten.reshape %result0_59, %668 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_64 = torch.constant.int 0
%int1_65 = torch.constant.int 1
%670 = torch.aten.mm %669, %10 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%671 = torch.aten.add.Tensor %670, %11, %int1_65 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%672 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_66 = torch.constant.int 1
%int7_67 = torch.constant.int 7
%int6400 = torch.constant.int 6400
%673 = torch.prim.ListConstruct %int1_66, %int7_67, %int6400 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%674 = torch.aten.reshape %671, %673 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%675 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%676 = torch.aten.mul.Tensor %674, %675 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%677 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%678 = torch.aten.pow.Tensor_Tensor %674, %677 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%679 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%680 = torch.aten.mul.Tensor %678, %679 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_68 = torch.constant.int 1
%681 = torch.aten.add.Tensor %674, %680, %int1_68 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%682 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%683 = torch.aten.mul.Tensor %681, %682 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%684 = torch.aten.tanh %683 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%685 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_69 = torch.constant.int 1
%686 = torch.aten.add.Tensor %684, %685, %int1_69 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%687 = torch.aten.mul.Tensor %676, %686 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%688 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_70 = torch.constant.int 7
%int6400_71 = torch.constant.int 6400
%689 = torch.prim.ListConstruct %int7_70, %int6400_71 : (!torch.int, !torch.int) -> !torch.list<int>
%690 = torch.aten.reshape %687, %689 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_72 = torch.constant.int 0
%int1_73 = torch.constant.int 1
%691 = torch.aten.mm %690, %12 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%692 = torch.aten.add.Tensor %691, %13, %int1_73 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%693 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_74 = torch.constant.int 1
%int7_75 = torch.constant.int 7
%int1600_76 = torch.constant.int 1600
%694 = torch.prim.ListConstruct %int1_74, %int7_75, %int1600_76 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%695 = torch.aten.reshape %692, %694 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_77 = torch.constant.int 1
%696 = torch.aten.add.Tensor %665, %695, %int1_77 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_78 = torch.constant.float 9.9999997473787516E-6
%int1600_79 = torch.constant.int 1600
%697 = torch.prim.ListConstruct %int1600_79 : (!torch.int) -> !torch.list<int>
%result0_80, %result1_81, %result2_82 = torch.aten.native_layer_norm %696, %697, %14, %15, %float9.999990e-06_78 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%698 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_83 = torch.constant.int 7
%int1600_84 = torch.constant.int 1600
%699 = torch.prim.ListConstruct %int7_83, %int1600_84 : (!torch.int, !torch.int) -> !torch.list<int>
%700 = torch.aten.reshape %result0_80, %699 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_85 = torch.constant.int 0
%int1_86 = torch.constant.int 1
%701 = torch.aten.mm %700, %16 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%702 = torch.aten.add.Tensor %701, %17, %int1_86 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%703 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_87 = torch.constant.int 1
%int7_88 = torch.constant.int 7
%int4800_89 = torch.constant.int 4800
%704 = torch.prim.ListConstruct %int1_87, %int7_88, %int4800_89 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%705 = torch.aten.reshape %702, %704 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%706 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%707 = torch.prim.tolist(%706) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2_90 = torch.constant.int 2
%708 = torch.aten.split_with_sizes %705, %707, %int2_90 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%709:3 = torch.prim.ListUnpack %708 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%710 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_91 = torch.constant.int 1
%int7_92 = torch.constant.int 7
%int25_93 = torch.constant.int 25
%int64_94 = torch.constant.int 64
%711 = torch.prim.ListConstruct %int1_91, %int7_92, %int25_93, %int64_94 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%712 = torch.aten.reshape %709#0, %711 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_95 = torch.constant.int 1
%int2_96 = torch.constant.int 2
%713 = torch.aten.transpose.int %712, %int1_95, %int2_96 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%714 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_97 = torch.constant.int 1
%int7_98 = torch.constant.int 7
%int25_99 = torch.constant.int 25
%int64_100 = torch.constant.int 64
%715 = torch.prim.ListConstruct %int1_97, %int7_98, %int25_99, %int64_100 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%716 = torch.aten.reshape %709#1, %715 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_101 = torch.constant.int 1
%int2_102 = torch.constant.int 2
%717 = torch.aten.transpose.int %716, %int1_101, %int2_102 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%718 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_103 = torch.constant.int 1
%int7_104 = torch.constant.int 7
%int25_105 = torch.constant.int 25
%int64_106 = torch.constant.int 64
%719 = torch.prim.ListConstruct %int1_103, %int7_104, %int25_105, %int64_106 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%720 = torch.aten.reshape %709#2, %719 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_107 = torch.constant.int 1
%int2_108 = torch.constant.int 2
%721 = torch.aten.transpose.int %720, %int1_107, %int2_108 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_109 = torch.constant.int 1
%int2_110 = torch.constant.int 2
%722 = torch.aten.transpose.int %716, %int1_109, %int2_110 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_111 = torch.constant.int 2
%int3_112 = torch.constant.int 3
%723 = torch.aten.transpose.int %722, %int2_111, %int3_112 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%724 = torch.aten.matmul %713, %723 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%725 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%726 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%727 = torch.aten.pow.Tensor_Tensor %725, %726 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%728 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_113 = torch.constant.int 0
%729 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_114 = torch.constant.none
%float0.000000e00_115 = torch.constant.float 0.000000e+00
%730 = torch.aten.full %729, %float0.000000e00_115, %none_114, %none_114, %none_114, %none_114 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_116 = torch.constant.int 1
%731 = torch.aten.add.Tensor %730, %727, %int1_116 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%732 = torch.aten.div.Tensor %724, %731 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%733 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6_117 = torch.constant.int 6
%none_118 = torch.constant.none
%false_119 = torch.constant.bool false
%734 = torch.aten.to.dtype %732, %int6_117, %false_119, %false_119, %none_118 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%735 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%736 = torch.aten.where.self %733, %734, %735 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_120 = torch.constant.int 3
%none_121 = torch.constant.none
%737 = torch.aten.softmax.int %736, %int3_120, %none_121 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_122 = torch.constant.int 6
%none_123 = torch.constant.none
%false_124 = torch.constant.bool false
%738 = torch.aten.to.dtype %737, %int6_122, %false_124, %false_124, %none_123 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%739 = torch.aten.matmul %738, %721 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_125 = torch.constant.int 1
%int2_126 = torch.constant.int 2
%740 = torch.aten.transpose.int %739, %int1_125, %int2_126 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%741 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_127 = torch.constant.int 1
%int7_128 = torch.constant.int 7
%int1600_129 = torch.constant.int 1600
%742 = torch.prim.ListConstruct %int1_127, %int7_128, %int1600_129 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%743 = torch.aten.reshape %740, %742 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%744 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_130 = torch.constant.int 7
%int1600_131 = torch.constant.int 1600
%745 = torch.prim.ListConstruct %int7_130, %int1600_131 : (!torch.int, !torch.int) -> !torch.list<int>
%746 = torch.aten.reshape %743, %745 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_132 = torch.constant.int 0
%int1_133 = torch.constant.int 1
%747 = torch.aten.mm %746, %18 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%748 = torch.aten.add.Tensor %747, %19, %int1_133 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%749 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_134 = torch.constant.int 1
%int7_135 = torch.constant.int 7
%int1600_136 = torch.constant.int 1600
%750 = torch.prim.ListConstruct %int1_134, %int7_135, %int1600_136 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%751 = torch.aten.reshape %748, %750 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_137 = torch.constant.int 1
%752 = torch.aten.add.Tensor %751, %696, %int1_137 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_138 = torch.constant.float 9.9999997473787516E-6
%int1600_139 = torch.constant.int 1600
%753 = torch.prim.ListConstruct %int1600_139 : (!torch.int) -> !torch.list<int>
%result0_140, %result1_141, %result2_142 = torch.aten.native_layer_norm %752, %753, %20, %21, %float9.999990e-06_138 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%754 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_143 = torch.constant.int 7
%int1600_144 = torch.constant.int 1600
%755 = torch.prim.ListConstruct %int7_143, %int1600_144 : (!torch.int, !torch.int) -> !torch.list<int>
%756 = torch.aten.reshape %result0_140, %755 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_145 = torch.constant.int 0
%int1_146 = torch.constant.int 1
%757 = torch.aten.mm %756, %22 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%758 = torch.aten.add.Tensor %757, %23, %int1_146 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%759 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_147 = torch.constant.int 1
%int7_148 = torch.constant.int 7
%int6400_149 = torch.constant.int 6400
%760 = torch.prim.ListConstruct %int1_147, %int7_148, %int6400_149 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%761 = torch.aten.reshape %758, %760 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%762 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%763 = torch.aten.mul.Tensor %761, %762 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%764 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%765 = torch.aten.pow.Tensor_Tensor %761, %764 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%766 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%767 = torch.aten.mul.Tensor %765, %766 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_150 = torch.constant.int 1
%768 = torch.aten.add.Tensor %761, %767, %int1_150 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%769 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%770 = torch.aten.mul.Tensor %768, %769 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%771 = torch.aten.tanh %770 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%772 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_151 = torch.constant.int 1
%773 = torch.aten.add.Tensor %771, %772, %int1_151 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%774 = torch.aten.mul.Tensor %763, %773 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%775 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_152 = torch.constant.int 7
%int6400_153 = torch.constant.int 6400
%776 = torch.prim.ListConstruct %int7_152, %int6400_153 : (!torch.int, !torch.int) -> !torch.list<int>
%777 = torch.aten.reshape %774, %776 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_154 = torch.constant.int 0
%int1_155 = torch.constant.int 1
%778 = torch.aten.mm %777, %24 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%779 = torch.aten.add.Tensor %778, %25, %int1_155 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%780 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_156 = torch.constant.int 1
%int7_157 = torch.constant.int 7
%int1600_158 = torch.constant.int 1600
%781 = torch.prim.ListConstruct %int1_156, %int7_157, %int1600_158 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%782 = torch.aten.reshape %779, %781 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_159 = torch.constant.int 1
%783 = torch.aten.add.Tensor %752, %782, %int1_159 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_160 = torch.constant.float 9.9999997473787516E-6
%int1600_161 = torch.constant.int 1600
%784 = torch.prim.ListConstruct %int1600_161 : (!torch.int) -> !torch.list<int>
%result0_162, %result1_163, %result2_164 = torch.aten.native_layer_norm %783, %784, %26, %27, %float9.999990e-06_160 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%785 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_165 = torch.constant.int 7
%int1600_166 = torch.constant.int 1600
%786 = torch.prim.ListConstruct %int7_165, %int1600_166 : (!torch.int, !torch.int) -> !torch.list<int>
%787 = torch.aten.reshape %result0_162, %786 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_167 = torch.constant.int 0
%int1_168 = torch.constant.int 1
%788 = torch.aten.mm %787, %28 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%789 = torch.aten.add.Tensor %788, %29, %int1_168 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%790 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_169 = torch.constant.int 1
%int7_170 = torch.constant.int 7
%int4800_171 = torch.constant.int 4800
%791 = torch.prim.ListConstruct %int1_169, %int7_170, %int4800_171 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%792 = torch.aten.reshape %789, %791 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%793 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%794 = torch.prim.tolist(%793) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2_172 = torch.constant.int 2
%795 = torch.aten.split_with_sizes %792, %794, %int2_172 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%796:3 = torch.prim.ListUnpack %795 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%797 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_173 = torch.constant.int 1
%int7_174 = torch.constant.int 7
%int25_175 = torch.constant.int 25
%int64_176 = torch.constant.int 64
%798 = torch.prim.ListConstruct %int1_173, %int7_174, %int25_175, %int64_176 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%799 = torch.aten.reshape %796#0, %798 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_177 = torch.constant.int 1
%int2_178 = torch.constant.int 2
%800 = torch.aten.transpose.int %799, %int1_177, %int2_178 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%801 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_179 = torch.constant.int 1
%int7_180 = torch.constant.int 7
%int25_181 = torch.constant.int 25
%int64_182 = torch.constant.int 64
%802 = torch.prim.ListConstruct %int1_179, %int7_180, %int25_181, %int64_182 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%803 = torch.aten.reshape %796#1, %802 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_183 = torch.constant.int 1
%int2_184 = torch.constant.int 2
%804 = torch.aten.transpose.int %803, %int1_183, %int2_184 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%805 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_185 = torch.constant.int 1
%int7_186 = torch.constant.int 7
%int25_187 = torch.constant.int 25
%int64_188 = torch.constant.int 64
%806 = torch.prim.ListConstruct %int1_185, %int7_186, %int25_187, %int64_188 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%807 = torch.aten.reshape %796#2, %806 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_189 = torch.constant.int 1
%int2_190 = torch.constant.int 2
%808 = torch.aten.transpose.int %807, %int1_189, %int2_190 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_191 = torch.constant.int 1
%int2_192 = torch.constant.int 2
%809 = torch.aten.transpose.int %803, %int1_191, %int2_192 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_193 = torch.constant.int 2
%int3_194 = torch.constant.int 3
%810 = torch.aten.transpose.int %809, %int2_193, %int3_194 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%811 = torch.aten.matmul %800, %810 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%812 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%813 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%814 = torch.aten.pow.Tensor_Tensor %812, %813 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%815 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_195 = torch.constant.int 0
%816 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_196 = torch.constant.none
%float0.000000e00_197 = torch.constant.float 0.000000e+00
%817 = torch.aten.full %816, %float0.000000e00_197, %none_196, %none_196, %none_196, %none_196 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_198 = torch.constant.int 1
%818 = torch.aten.add.Tensor %817, %814, %int1_198 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%819 = torch.aten.div.Tensor %811, %818 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%820 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6_199 = torch.constant.int 6
%none_200 = torch.constant.none
%false_201 = torch.constant.bool false
%821 = torch.aten.to.dtype %819, %int6_199, %false_201, %false_201, %none_200 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%822 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%823 = torch.aten.where.self %820, %821, %822 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_202 = torch.constant.int 3
%none_203 = torch.constant.none
%824 = torch.aten.softmax.int %823, %int3_202, %none_203 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_204 = torch.constant.int 6
%none_205 = torch.constant.none
%false_206 = torch.constant.bool false
%825 = torch.aten.to.dtype %824, %int6_204, %false_206, %false_206, %none_205 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%826 = torch.aten.matmul %825, %808 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_207 = torch.constant.int 1
%int2_208 = torch.constant.int 2
%827 = torch.aten.transpose.int %826, %int1_207, %int2_208 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%828 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_209 = torch.constant.int 1
%int7_210 = torch.constant.int 7
%int1600_211 = torch.constant.int 1600
%829 = torch.prim.ListConstruct %int1_209, %int7_210, %int1600_211 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%830 = torch.aten.reshape %827, %829 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%831 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_212 = torch.constant.int 7
%int1600_213 = torch.constant.int 1600
%832 = torch.prim.ListConstruct %int7_212, %int1600_213 : (!torch.int, !torch.int) -> !torch.list<int>
%833 = torch.aten.reshape %830, %832 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_214 = torch.constant.int 0
%int1_215 = torch.constant.int 1
%834 = torch.aten.mm %833, %30 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%835 = torch.aten.add.Tensor %834, %31, %int1_215 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%836 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_216 = torch.constant.int 1
%int7_217 = torch.constant.int 7
%int1600_218 = torch.constant.int 1600
%837 = torch.prim.ListConstruct %int1_216, %int7_217, %int1600_218 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%838 = torch.aten.reshape %835, %837 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_219 = torch.constant.int 1
%839 = torch.aten.add.Tensor %838, %783, %int1_219 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_220 = torch.constant.float 9.9999997473787516E-6
%int1600_221 = torch.constant.int 1600
%840 = torch.prim.ListConstruct %int1600_221 : (!torch.int) -> !torch.list<int>
%result0_222, %result1_223, %result2_224 = torch.aten.native_layer_norm %839, %840, %32, %33, %float9.999990e-06_220 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%841 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_225 = torch.constant.int 7
%int1600_226 = torch.constant.int 1600
%842 = torch.prim.ListConstruct %int7_225, %int1600_226 : (!torch.int, !torch.int) -> !torch.list<int>
%843 = torch.aten.reshape %result0_222, %842 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_227 = torch.constant.int 0
%int1_228 = torch.constant.int 1
%844 = torch.aten.mm %843, %34 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%845 = torch.aten.add.Tensor %844, %35, %int1_228 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%846 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_229 = torch.constant.int 1
%int7_230 = torch.constant.int 7
%int6400_231 = torch.constant.int 6400
%847 = torch.prim.ListConstruct %int1_229, %int7_230, %int6400_231 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%848 = torch.aten.reshape %845, %847 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%849 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%850 = torch.aten.mul.Tensor %848, %849 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%851 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%852 = torch.aten.pow.Tensor_Tensor %848, %851 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%853 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%854 = torch.aten.mul.Tensor %852, %853 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_232 = torch.constant.int 1
%855 = torch.aten.add.Tensor %848, %854, %int1_232 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%856 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%857 = torch.aten.mul.Tensor %855, %856 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%858 = torch.aten.tanh %857 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%859 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_233 = torch.constant.int 1
%860 = torch.aten.add.Tensor %858, %859, %int1_233 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%861 = torch.aten.mul.Tensor %850, %860 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%862 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_234 = torch.constant.int 7
%int6400_235 = torch.constant.int 6400
%863 = torch.prim.ListConstruct %int7_234, %int6400_235 : (!torch.int, !torch.int) -> !torch.list<int>
%864 = torch.aten.reshape %861, %863 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_236 = torch.constant.int 0
%int1_237 = torch.constant.int 1
%865 = torch.aten.mm %864, %36 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%866 = torch.aten.add.Tensor %865, %37, %int1_237 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%867 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_238 = torch.constant.int 1
%int7_239 = torch.constant.int 7
%int1600_240 = torch.constant.int 1600
%868 = torch.prim.ListConstruct %int1_238, %int7_239, %int1600_240 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%869 = torch.aten.reshape %866, %868 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_241 = torch.constant.int 1
%870 = torch.aten.add.Tensor %839, %869, %int1_241 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_242 = torch.constant.float 9.9999997473787516E-6
%int1600_243 = torch.constant.int 1600
%871 = torch.prim.ListConstruct %int1600_243 : (!torch.int) -> !torch.list<int>
%result0_244, %result1_245, %result2_246 = torch.aten.native_layer_norm %870, %871, %38, %39, %float9.999990e-06_242 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%872 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_247 = torch.constant.int 7
%int1600_248 = torch.constant.int 1600
%873 = torch.prim.ListConstruct %int7_247, %int1600_248 : (!torch.int, !torch.int) -> !torch.list<int>
%874 = torch.aten.reshape %result0_244, %873 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_249 = torch.constant.int 0
%int1_250 = torch.constant.int 1
%875 = torch.aten.mm %874, %40 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%876 = torch.aten.add.Tensor %875, %41, %int1_250 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%877 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_251 = torch.constant.int 1
%int7_252 = torch.constant.int 7
%int4800_253 = torch.constant.int 4800
%878 = torch.prim.ListConstruct %int1_251, %int7_252, %int4800_253 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%879 = torch.aten.reshape %876, %878 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%880 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%881 = torch.prim.tolist(%880) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2_254 = torch.constant.int 2
%882 = torch.aten.split_with_sizes %879, %881, %int2_254 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%883:3 = torch.prim.ListUnpack %882 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%884 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_255 = torch.constant.int 1
%int7_256 = torch.constant.int 7
%int25_257 = torch.constant.int 25
%int64_258 = torch.constant.int 64
%885 = torch.prim.ListConstruct %int1_255, %int7_256, %int25_257, %int64_258 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%886 = torch.aten.reshape %883#0, %885 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_259 = torch.constant.int 1
%int2_260 = torch.constant.int 2
%887 = torch.aten.transpose.int %886, %int1_259, %int2_260 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%888 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_261 = torch.constant.int 1
%int7_262 = torch.constant.int 7
%int25_263 = torch.constant.int 25
%int64_264 = torch.constant.int 64
%889 = torch.prim.ListConstruct %int1_261, %int7_262, %int25_263, %int64_264 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%890 = torch.aten.reshape %883#1, %889 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_265 = torch.constant.int 1
%int2_266 = torch.constant.int 2
%891 = torch.aten.transpose.int %890, %int1_265, %int2_266 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%892 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_267 = torch.constant.int 1
%int7_268 = torch.constant.int 7
%int25_269 = torch.constant.int 25
%int64_270 = torch.constant.int 64
%893 = torch.prim.ListConstruct %int1_267, %int7_268, %int25_269, %int64_270 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%894 = torch.aten.reshape %883#2, %893 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_271 = torch.constant.int 1
%int2_272 = torch.constant.int 2
%895 = torch.aten.transpose.int %894, %int1_271, %int2_272 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_273 = torch.constant.int 1
%int2_274 = torch.constant.int 2
%896 = torch.aten.transpose.int %890, %int1_273, %int2_274 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_275 = torch.constant.int 2
%int3_276 = torch.constant.int 3
%897 = torch.aten.transpose.int %896, %int2_275, %int3_276 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%898 = torch.aten.matmul %887, %897 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%899 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%900 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%901 = torch.aten.pow.Tensor_Tensor %899, %900 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%902 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_277 = torch.constant.int 0
%903 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_278 = torch.constant.none
%float0.000000e00_279 = torch.constant.float 0.000000e+00
%904 = torch.aten.full %903, %float0.000000e00_279, %none_278, %none_278, %none_278, %none_278 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_280 = torch.constant.int 1
%905 = torch.aten.add.Tensor %904, %901, %int1_280 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%906 = torch.aten.div.Tensor %898, %905 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%907 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6_281 = torch.constant.int 6
%none_282 = torch.constant.none
%false_283 = torch.constant.bool false
%908 = torch.aten.to.dtype %906, %int6_281, %false_283, %false_283, %none_282 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%909 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%910 = torch.aten.where.self %907, %908, %909 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_284 = torch.constant.int 3
%none_285 = torch.constant.none
%911 = torch.aten.softmax.int %910, %int3_284, %none_285 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_286 = torch.constant.int 6
%none_287 = torch.constant.none
%false_288 = torch.constant.bool false
%912 = torch.aten.to.dtype %911, %int6_286, %false_288, %false_288, %none_287 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%913 = torch.aten.matmul %912, %895 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_289 = torch.constant.int 1
%int2_290 = torch.constant.int 2
%914 = torch.aten.transpose.int %913, %int1_289, %int2_290 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%915 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_291 = torch.constant.int 1
%int7_292 = torch.constant.int 7
%int1600_293 = torch.constant.int 1600
%916 = torch.prim.ListConstruct %int1_291, %int7_292, %int1600_293 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%917 = torch.aten.reshape %914, %916 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%918 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_294 = torch.constant.int 7
%int1600_295 = torch.constant.int 1600
%919 = torch.prim.ListConstruct %int7_294, %int1600_295 : (!torch.int, !torch.int) -> !torch.list<int>
%920 = torch.aten.reshape %917, %919 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_296 = torch.constant.int 0
%int1_297 = torch.constant.int 1
%921 = torch.aten.mm %920, %42 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%922 = torch.aten.add.Tensor %921, %43, %int1_297 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%923 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_298 = torch.constant.int 1
%int7_299 = torch.constant.int 7
%int1600_300 = torch.constant.int 1600
%924 = torch.prim.ListConstruct %int1_298, %int7_299, %int1600_300 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%925 = torch.aten.reshape %922, %924 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_301 = torch.constant.int 1
%926 = torch.aten.add.Tensor %925, %870, %int1_301 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_302 = torch.constant.float 9.9999997473787516E-6
%int1600_303 = torch.constant.int 1600
%927 = torch.prim.ListConstruct %int1600_303 : (!torch.int) -> !torch.list<int>
%result0_304, %result1_305, %result2_306 = torch.aten.native_layer_norm %926, %927, %44, %45, %float9.999990e-06_302 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%928 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_307 = torch.constant.int 7
%int1600_308 = torch.constant.int 1600
%929 = torch.prim.ListConstruct %int7_307, %int1600_308 : (!torch.int, !torch.int) -> !torch.list<int>
%930 = torch.aten.reshape %result0_304, %929 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_309 = torch.constant.int 0
%int1_310 = torch.constant.int 1
%931 = torch.aten.mm %930, %46 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%932 = torch.aten.add.Tensor %931, %47, %int1_310 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%933 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_311 = torch.constant.int 1
%int7_312 = torch.constant.int 7
%int6400_313 = torch.constant.int 6400
%934 = torch.prim.ListConstruct %int1_311, %int7_312, %int6400_313 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%935 = torch.aten.reshape %932, %934 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%936 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%937 = torch.aten.mul.Tensor %935, %936 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%938 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%939 = torch.aten.pow.Tensor_Tensor %935, %938 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%940 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%941 = torch.aten.mul.Tensor %939, %940 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_314 = torch.constant.int 1
%942 = torch.aten.add.Tensor %935, %941, %int1_314 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%943 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%944 = torch.aten.mul.Tensor %942, %943 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%945 = torch.aten.tanh %944 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%946 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_315 = torch.constant.int 1
%947 = torch.aten.add.Tensor %945, %946, %int1_315 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%948 = torch.aten.mul.Tensor %937, %947 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%949 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_316 = torch.constant.int 7
%int6400_317 = torch.constant.int 6400
%950 = torch.prim.ListConstruct %int7_316, %int6400_317 : (!torch.int, !torch.int) -> !torch.list<int>
%951 = torch.aten.reshape %948, %950 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_318 = torch.constant.int 0
%int1_319 = torch.constant.int 1
%952 = torch.aten.mm %951, %48 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%953 = torch.aten.add.Tensor %952, %49, %int1_319 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%954 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_320 = torch.constant.int 1
%int7_321 = torch.constant.int 7
%int1600_322 = torch.constant.int 1600
%955 = torch.prim.ListConstruct %int1_320, %int7_321, %int1600_322 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%956 = torch.aten.reshape %953, %955 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_323 = torch.constant.int 1
%957 = torch.aten.add.Tensor %926, %956, %int1_323 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_324 = torch.constant.float 9.9999997473787516E-6
%int1600_325 = torch.constant.int 1600
%958 = torch.prim.ListConstruct %int1600_325 : (!torch.int) -> !torch.list<int>
%result0_326, %result1_327, %result2_328 = torch.aten.native_layer_norm %957, %958, %50, %51, %float9.999990e-06_324 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%959 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_329 = torch.constant.int 7
%int1600_330 = torch.constant.int 1600
%960 = torch.prim.ListConstruct %int7_329, %int1600_330 : (!torch.int, !torch.int) -> !torch.list<int>
%961 = torch.aten.reshape %result0_326, %960 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_331 = torch.constant.int 0
%int1_332 = torch.constant.int 1
%962 = torch.aten.mm %961, %52 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%963 = torch.aten.add.Tensor %962, %53, %int1_332 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%964 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_333 = torch.constant.int 1
%int7_334 = torch.constant.int 7
%int4800_335 = torch.constant.int 4800
%965 = torch.prim.ListConstruct %int1_333, %int7_334, %int4800_335 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%966 = torch.aten.reshape %963, %965 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%967 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%968 = torch.prim.tolist(%967) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2_336 = torch.constant.int 2
%969 = torch.aten.split_with_sizes %966, %968, %int2_336 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%970:3 = torch.prim.ListUnpack %969 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%971 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_337 = torch.constant.int 1
%int7_338 = torch.constant.int 7
%int25_339 = torch.constant.int 25
%int64_340 = torch.constant.int 64
%972 = torch.prim.ListConstruct %int1_337, %int7_338, %int25_339, %int64_340 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%973 = torch.aten.reshape %970#0, %972 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_341 = torch.constant.int 1
%int2_342 = torch.constant.int 2
%974 = torch.aten.transpose.int %973, %int1_341, %int2_342 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%975 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_343 = torch.constant.int 1
%int7_344 = torch.constant.int 7
%int25_345 = torch.constant.int 25
%int64_346 = torch.constant.int 64
%976 = torch.prim.ListConstruct %int1_343, %int7_344, %int25_345, %int64_346 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%977 = torch.aten.reshape %970#1, %976 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_347 = torch.constant.int 1
%int2_348 = torch.constant.int 2
%978 = torch.aten.transpose.int %977, %int1_347, %int2_348 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%979 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_349 = torch.constant.int 1
%int7_350 = torch.constant.int 7
%int25_351 = torch.constant.int 25
%int64_352 = torch.constant.int 64
%980 = torch.prim.ListConstruct %int1_349, %int7_350, %int25_351, %int64_352 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%981 = torch.aten.reshape %970#2, %980 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_353 = torch.constant.int 1
%int2_354 = torch.constant.int 2
%982 = torch.aten.transpose.int %981, %int1_353, %int2_354 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_355 = torch.constant.int 1
%int2_356 = torch.constant.int 2
%983 = torch.aten.transpose.int %977, %int1_355, %int2_356 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_357 = torch.constant.int 2
%int3_358 = torch.constant.int 3
%984 = torch.aten.transpose.int %983, %int2_357, %int3_358 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%985 = torch.aten.matmul %974, %984 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%986 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%987 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%988 = torch.aten.pow.Tensor_Tensor %986, %987 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%989 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_359 = torch.constant.int 0
%990 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_360 = torch.constant.none
%float0.000000e00_361 = torch.constant.float 0.000000e+00
%991 = torch.aten.full %990, %float0.000000e00_361, %none_360, %none_360, %none_360, %none_360 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_362 = torch.constant.int 1
%992 = torch.aten.add.Tensor %991, %988, %int1_362 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%993 = torch.aten.div.Tensor %985, %992 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%994 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6_363 = torch.constant.int 6
%none_364 = torch.constant.none
%false_365 = torch.constant.bool false
%995 = torch.aten.to.dtype %993, %int6_363, %false_365, %false_365, %none_364 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%996 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%997 = torch.aten.where.self %994, %995, %996 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_366 = torch.constant.int 3
%none_367 = torch.constant.none
%998 = torch.aten.softmax.int %997, %int3_366, %none_367 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_368 = torch.constant.int 6
%none_369 = torch.constant.none
%false_370 = torch.constant.bool false
%999 = torch.aten.to.dtype %998, %int6_368, %false_370, %false_370, %none_369 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%1000 = torch.aten.matmul %999, %982 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_371 = torch.constant.int 1
%int2_372 = torch.constant.int 2
%1001 = torch.aten.transpose.int %1000, %int1_371, %int2_372 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%1002 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_373 = torch.constant.int 1
%int7_374 = torch.constant.int 7
%int1600_375 = torch.constant.int 1600
%1003 = torch.prim.ListConstruct %int1_373, %int7_374, %int1600_375 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1004 = torch.aten.reshape %1001, %1003 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%1005 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_376 = torch.constant.int 7
%int1600_377 = torch.constant.int 1600
%1006 = torch.prim.ListConstruct %int7_376, %int1600_377 : (!torch.int, !torch.int) -> !torch.list<int>
%1007 = torch.aten.reshape %1004, %1006 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_378 = torch.constant.int 0
%int1_379 = torch.constant.int 1
%1008 = torch.aten.mm %1007, %54 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%1009 = torch.aten.add.Tensor %1008, %55, %int1_379 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%1010 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_380 = torch.constant.int 1
%int7_381 = torch.constant.int 7
%int1600_382 = torch.constant.int 1600
%1011 = torch.prim.ListConstruct %int1_380, %int7_381, %int1600_382 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1012 = torch.aten.reshape %1009, %1011 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_383 = torch.constant.int 1
%1013 = torch.aten.add.Tensor %1012, %957, %int1_383 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_384 = torch.constant.float 9.9999997473787516E-6
%int1600_385 = torch.constant.int 1600
%1014 = torch.prim.ListConstruct %int1600_385 : (!torch.int) -> !torch.list<int>
%result0_386, %result1_387, %result2_388 = torch.aten.native_layer_norm %1013, %1014, %56, %57, %float9.999990e-06_384 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%1015 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_389 = torch.constant.int 7
%int1600_390 = torch.constant.int 1600
%1016 = torch.prim.ListConstruct %int7_389, %int1600_390 : (!torch.int, !torch.int) -> !torch.list<int>
%1017 = torch.aten.reshape %result0_386, %1016 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_391 = torch.constant.int 0
%int1_392 = torch.constant.int 1
%1018 = torch.aten.mm %1017, %58 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%1019 = torch.aten.add.Tensor %1018, %59, %int1_392 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%1020 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_393 = torch.constant.int 1
%int7_394 = torch.constant.int 7
%int6400_395 = torch.constant.int 6400
%1021 = torch.prim.ListConstruct %int1_393, %int7_394, %int6400_395 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1022 = torch.aten.reshape %1019, %1021 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%1023 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%1024 = torch.aten.mul.Tensor %1022, %1023 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%1025 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%1026 = torch.aten.pow.Tensor_Tensor %1022, %1025 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%1027 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%1028 = torch.aten.mul.Tensor %1026, %1027 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_396 = torch.constant.int 1
%1029 = torch.aten.add.Tensor %1022, %1028, %int1_396 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%1030 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%1031 = torch.aten.mul.Tensor %1029, %1030 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%1032 = torch.aten.tanh %1031 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%1033 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_397 = torch.constant.int 1
%1034 = torch.aten.add.Tensor %1032, %1033, %int1_397 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%1035 = torch.aten.mul.Tensor %1024, %1034 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%1036 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_398 = torch.constant.int 7
%int6400_399 = torch.constant.int 6400
%1037 = torch.prim.ListConstruct %int7_398, %int6400_399 : (!torch.int, !torch.int) -> !torch.list<int>
%1038 = torch.aten.reshape %1035, %1037 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_400 = torch.constant.int 0
%int1_401 = torch.constant.int 1
%1039 = torch.aten.mm %1038, %60 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%1040 = torch.aten.add.Tensor %1039, %61, %int1_401 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%1041 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_402 = torch.constant.int 1
%int7_403 = torch.constant.int 7
%int1600_404 = torch.constant.int 1600
%1042 = torch.prim.ListConstruct %int1_402, %int7_403, %int1600_404 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1043 = torch.aten.reshape %1040, %1042 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_405 = torch.constant.int 1
%1044 = torch.aten.add.Tensor %1013, %1043, %int1_405 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_406 = torch.constant.float 9.9999997473787516E-6
%int1600_407 = torch.constant.int 1600
%1045 = torch.prim.ListConstruct %int1600_407 : (!torch.int) -> !torch.list<int>
%result0_408, %result1_409, %result2_410 = torch.aten.native_layer_norm %1044, %1045, %62, %63, %float9.999990e-06_406 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%1046 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_411 = torch.constant.int 7
%int1600_412 = torch.constant.int 1600
%1047 = torch.prim.ListConstruct %int7_411, %int1600_412 : (!torch.int, !torch.int) -> !torch.list<int>
%1048 = torch.aten.reshape %result0_408, %1047 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_413 = torch.constant.int 0
%int1_414 = torch.constant.int 1
%1049 = torch.aten.mm %1048, %64 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%1050 = torch.aten.add.Tensor %1049, %65, %int1_414 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%1051 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_415 = torch.constant.int 1
%int7_416 = torch.constant.int 7
%int4800_417 = torch.constant.int 4800
%1052 = torch.prim.ListConstruct %int1_415, %int7_416, %int4800_417 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1053 = torch.aten.reshape %1050, %1052 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%1054 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%1055 = torch.prim.tolist(%1054) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2_418 = torch.constant.int 2
%1056 = torch.aten.split_with_sizes %1053, %1055, %int2_418 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%1057:3 = torch.prim.ListUnpack %1056 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%1058 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_419 = torch.constant.int 1
%int7_420 = torch.constant.int 7
%int25_421 = torch.constant.int 25
%int64_422 = torch.constant.int 64
%1059 = torch.prim.ListConstruct %int1_419, %int7_420, %int25_421, %int64_422 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1060 = torch.aten.reshape %1057#0, %1059 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_423 = torch.constant.int 1
%int2_424 = torch.constant.int 2
%1061 = torch.aten.transpose.int %1060, %int1_423, %int2_424 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%1062 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_425 = torch.constant.int 1
%int7_426 = torch.constant.int 7
%int25_427 = torch.constant.int 25
%int64_428 = torch.constant.int 64
%1063 = torch.prim.ListConstruct %int1_425, %int7_426, %int25_427, %int64_428 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1064 = torch.aten.reshape %1057#1, %1063 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_429 = torch.constant.int 1
%int2_430 = torch.constant.int 2
%1065 = torch.aten.transpose.int %1064, %int1_429, %int2_430 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%1066 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_431 = torch.constant.int 1
%int7_432 = torch.constant.int 7
%int25_433 = torch.constant.int 25
%int64_434 = torch.constant.int 64
%1067 = torch.prim.ListConstruct %int1_431, %int7_432, %int25_433, %int64_434 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1068 = torch.aten.reshape %1057#2, %1067 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_435 = torch.constant.int 1
%int2_436 = torch.constant.int 2
%1069 = torch.aten.transpose.int %1068, %int1_435, %int2_436 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_437 = torch.constant.int 1
%int2_438 = torch.constant.int 2
%1070 = torch.aten.transpose.int %1064, %int1_437, %int2_438 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_439 = torch.constant.int 2
%int3_440 = torch.constant.int 3
%1071 = torch.aten.transpose.int %1070, %int2_439, %int3_440 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%1072 = torch.aten.matmul %1061, %1071 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%1073 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%1074 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%1075 = torch.aten.pow.Tensor_Tensor %1073, %1074 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%1076 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_441 = torch.constant.int 0
%1077 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_442 = torch.constant.none
%float0.000000e00_443 = torch.constant.float 0.000000e+00
%1078 = torch.aten.full %1077, %float0.000000e00_443, %none_442, %none_442, %none_442, %none_442 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_444 = torch.constant.int 1
%1079 = torch.aten.add.Tensor %1078, %1075, %int1_444 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%1080 = torch.aten.div.Tensor %1072, %1079 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%1081 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6_445 = torch.constant.int 6
%none_446 = torch.constant.none
%false_447 = torch.constant.bool false
%1082 = torch.aten.to.dtype %1080, %int6_445, %false_447, %false_447, %none_446 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%1083 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%1084 = torch.aten.where.self %1081, %1082, %1083 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_448 = torch.constant.int 3
%none_449 = torch.constant.none
%1085 = torch.aten.softmax.int %1084, %int3_448, %none_449 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_450 = torch.constant.int 6
%none_451 = torch.constant.none
%false_452 = torch.constant.bool false
%1086 = torch.aten.to.dtype %1085, %int6_450, %false_452, %false_452, %none_451 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%1087 = torch.aten.matmul %1086, %1069 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_453 = torch.constant.int 1
%int2_454 = torch.constant.int 2
%1088 = torch.aten.transpose.int %1087, %int1_453, %int2_454 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%1089 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_455 = torch.constant.int 1
%int7_456 = torch.constant.int 7
%int1600_457 = torch.constant.int 1600
%1090 = torch.prim.ListConstruct %int1_455, %int7_456, %int1600_457 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1091 = torch.aten.reshape %1088, %1090 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%1092 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_458 = torch.constant.int 7
%int1600_459 = torch.constant.int 1600
%1093 = torch.prim.ListConstruct %int7_458, %int1600_459 : (!torch.int, !torch.int) -> !torch.list<int>
%1094 = torch.aten.reshape %1091, %1093 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_460 = torch.constant.int 0
%int1_461 = torch.constant.int 1
%1095 = torch.aten.mm %1094, %66 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%1096 = torch.aten.add.Tensor %1095, %67, %int1_461 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%1097 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_462 = torch.constant.int 1
%int7_463 = torch.constant.int 7
%int1600_464 = torch.constant.int 1600
%1098 = torch.prim.ListConstruct %int1_462, %int7_463, %int1600_464 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1099 = torch.aten.reshape %1096, %1098 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_465 = torch.constant.int 1
%1100 = torch.aten.add.Tensor %1099, %1044, %int1_465 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_466 = torch.constant.float 9.9999997473787516E-6
%int1600_467 = torch.constant.int 1600
%1101 = torch.prim.ListConstruct %int1600_467 : (!torch.int) -> !torch.list<int>
%result0_468, %result1_469, %result2_470 = torch.aten.native_layer_norm %1100, %1101, %68, %69, %float9.999990e-06_466 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%1102 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_471 = torch.constant.int 7
%int1600_472 = torch.constant.int 1600
%1103 = torch.prim.ListConstruct %int7_471, %int1600_472 : (!torch.int, !torch.int) -> !torch.list<int>
%1104 = torch.aten.reshape %result0_468, %1103 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_473 = torch.constant.int 0
%int1_474 = torch.constant.int 1
%1105 = torch.aten.mm %1104, %70 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%1106 = torch.aten.add.Tensor %1105, %71, %int1_474 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%1107 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_475 = torch.constant.int 1
%int7_476 = torch.constant.int 7
%int6400_477 = torch.constant.int 6400
%1108 = torch.prim.ListConstruct %int1_475, %int7_476, %int6400_477 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1109 = torch.aten.reshape %1106, %1108 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%1110 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%1111 = torch.aten.mul.Tensor %1109, %1110 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%1112 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%1113 = torch.aten.pow.Tensor_Tensor %1109, %1112 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%1114 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%1115 = torch.aten.mul.Tensor %1113, %1114 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_478 = torch.constant.int 1
%1116 = torch.aten.add.Tensor %1109, %1115, %int1_478 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%1117 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%1118 = torch.aten.mul.Tensor %1116, %1117 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%1119 = torch.aten.tanh %1118 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%1120 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_479 = torch.constant.int 1
%1121 = torch.aten.add.Tensor %1119, %1120, %int1_479 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%1122 = torch.aten.mul.Tensor %1111, %1121 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%1123 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_480 = torch.constant.int 7
%int6400_481 = torch.constant.int 6400
%1124 = torch.prim.ListConstruct %int7_480, %int6400_481 : (!torch.int, !torch.int) -> !torch.list<int>
%1125 = torch.aten.reshape %1122, %1124 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_482 = torch.constant.int 0
%int1_483 = torch.constant.int 1
%1126 = torch.aten.mm %1125, %72 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%1127 = torch.aten.add.Tensor %1126, %73, %int1_483 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%1128 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_484 = torch.constant.int 1
%int7_485 = torch.constant.int 7
%int1600_486 = torch.constant.int 1600
%1129 = torch.prim.ListConstruct %int1_484, %int7_485, %int1600_486 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1130 = torch.aten.reshape %1127, %1129 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_487 = torch.constant.int 1
%1131 = torch.aten.add.Tensor %1100, %1130, %int1_487 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_488 = torch.constant.float 9.9999997473787516E-6
%int1600_489 = torch.constant.int 1600
%1132 = torch.prim.ListConstruct %int1600_489 : (!torch.int) -> !torch.list<int>
%result0_490, %result1_491, %result2_492 = torch.aten.native_layer_norm %1131, %1132, %74, %75, %float9.999990e-06_488 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%1133 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_493 = torch.constant.int 7
%int1600_494 = torch.constant.int 1600
%1134 = torch.prim.ListConstruct %int7_493, %int1600_494 : (!torch.int, !torch.int) -> !torch.list<int>
%1135 = torch.aten.reshape %result0_490, %1134 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_495 = torch.constant.int 0
%int1_496 = torch.constant.int 1
%1136 = torch.aten.mm %1135, %76 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%1137 = torch.aten.add.Tensor %1136, %77, %int1_496 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%1138 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_497 = torch.constant.int 1
%int7_498 = torch.constant.int 7
%int4800_499 = torch.constant.int 4800
%1139 = torch.prim.ListConstruct %int1_497, %int7_498, %int4800_499 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1140 = torch.aten.reshape %1137, %1139 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%1141 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%1142 = torch.prim.tolist(%1141) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2_500 = torch.constant.int 2
%1143 = torch.aten.split_with_sizes %1140, %1142, %int2_500 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%1144:3 = torch.prim.ListUnpack %1143 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%1145 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_501 = torch.constant.int 1
%int7_502 = torch.constant.int 7
%int25_503 = torch.constant.int 25
%int64_504 = torch.constant.int 64
%1146 = torch.prim.ListConstruct %int1_501, %int7_502, %int25_503, %int64_504 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1147 = torch.aten.reshape %1144#0, %1146 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_505 = torch.constant.int 1
%int2_506 = torch.constant.int 2
%1148 = torch.aten.transpose.int %1147, %int1_505, %int2_506 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%1149 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_507 = torch.constant.int 1
%int7_508 = torch.constant.int 7
%int25_509 = torch.constant.int 25
%int64_510 = torch.constant.int 64
%1150 = torch.prim.ListConstruct %int1_507, %int7_508, %int25_509, %int64_510 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1151 = torch.aten.reshape %1144#1, %1150 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_511 = torch.constant.int 1
%int2_512 = torch.constant.int 2
%1152 = torch.aten.transpose.int %1151, %int1_511, %int2_512 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%1153 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_513 = torch.constant.int 1
%int7_514 = torch.constant.int 7
%int25_515 = torch.constant.int 25
%int64_516 = torch.constant.int 64
%1154 = torch.prim.ListConstruct %int1_513, %int7_514, %int25_515, %int64_516 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1155 = torch.aten.reshape %1144#2, %1154 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_517 = torch.constant.int 1
%int2_518 = torch.constant.int 2
%1156 = torch.aten.transpose.int %1155, %int1_517, %int2_518 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_519 = torch.constant.int 1
%int2_520 = torch.constant.int 2
%1157 = torch.aten.transpose.int %1151, %int1_519, %int2_520 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_521 = torch.constant.int 2
%int3_522 = torch.constant.int 3
%1158 = torch.aten.transpose.int %1157, %int2_521, %int3_522 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%1159 = torch.aten.matmul %1148, %1158 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%1160 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%1161 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%1162 = torch.aten.pow.Tensor_Tensor %1160, %1161 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%1163 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_523 = torch.constant.int 0
%1164 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_524 = torch.constant.none
%float0.000000e00_525 = torch.constant.float 0.000000e+00
%1165 = torch.aten.full %1164, %float0.000000e00_525, %none_524, %none_524, %none_524, %none_524 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_526 = torch.constant.int 1
%1166 = torch.aten.add.Tensor %1165, %1162, %int1_526 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%1167 = torch.aten.div.Tensor %1159, %1166 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%1168 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6_527 = torch.constant.int 6
%none_528 = torch.constant.none
%false_529 = torch.constant.bool false
%1169 = torch.aten.to.dtype %1167, %int6_527, %false_529, %false_529, %none_528 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%1170 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%1171 = torch.aten.where.self %1168, %1169, %1170 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_530 = torch.constant.int 3
%none_531 = torch.constant.none
%1172 = torch.aten.softmax.int %1171, %int3_530, %none_531 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_532 = torch.constant.int 6
%none_533 = torch.constant.none
%false_534 = torch.constant.bool false
%1173 = torch.aten.to.dtype %1172, %int6_532, %false_534, %false_534, %none_533 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%1174 = torch.aten.matmul %1173, %1156 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_535 = torch.constant.int 1
%int2_536 = torch.constant.int 2
%1175 = torch.aten.transpose.int %1174, %int1_535, %int2_536 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%1176 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_537 = torch.constant.int 1
%int7_538 = torch.constant.int 7
%int1600_539 = torch.constant.int 1600
%1177 = torch.prim.ListConstruct %int1_537, %int7_538, %int1600_539 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1178 = torch.aten.reshape %1175, %1177 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%1179 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_540 = torch.constant.int 7
%int1600_541 = torch.constant.int 1600
%1180 = torch.prim.ListConstruct %int7_540, %int1600_541 : (!torch.int, !torch.int) -> !torch.list<int>
%1181 = torch.aten.reshape %1178, %1180 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_542 = torch.constant.int 0
%int1_543 = torch.constant.int 1
%1182 = torch.aten.mm %1181, %78 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%1183 = torch.aten.add.Tensor %1182, %79, %int1_543 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%1184 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_544 = torch.constant.int 1
%int7_545 = torch.constant.int 7
%int1600_546 = torch.constant.int 1600
%1185 = torch.prim.ListConstruct %int1_544, %int7_545, %int1600_546 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1186 = torch.aten.reshape %1183, %1185 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_547 = torch.constant.int 1
%1187 = torch.aten.add.Tensor %1186, %1131, %int1_547 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_548 = torch.constant.float 9.9999997473787516E-6
%int1600_549 = torch.constant.int 1600
%1188 = torch.prim.ListConstruct %int1600_549 : (!torch.int) -> !torch.list<int>
%result0_550, %result1_551, %result2_552 = torch.aten.native_layer_norm %1187, %1188, %80, %81, %float9.999990e-06_548 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%1189 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_553 = torch.constant.int 7
%int1600_554 = torch.constant.int 1600
%1190 = torch.prim.ListConstruct %int7_553, %int1600_554 : (!torch.int, !torch.int) -> !torch.list<int>
%1191 = torch.aten.reshape %result0_550, %1190 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_555 = torch.constant.int 0
%int1_556 = torch.constant.int 1
%1192 = torch.aten.mm %1191, %82 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%1193 = torch.aten.add.Tensor %1192, %83, %int1_556 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%1194 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_557 = torch.constant.int 1
%int7_558 = torch.constant.int 7
%int6400_559 = torch.constant.int 6400
%1195 = torch.prim.ListConstruct %int1_557, %int7_558, %int6400_559 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1196 = torch.aten.reshape %1193, %1195 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%1197 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%1198 = torch.aten.mul.Tensor %1196, %1197 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%1199 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%1200 = torch.aten.pow.Tensor_Tensor %1196, %1199 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%1201 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%1202 = torch.aten.mul.Tensor %1200, %1201 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_560 = torch.constant.int 1
%1203 = torch.aten.add.Tensor %1196, %1202, %int1_560 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%1204 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%1205 = torch.aten.mul.Tensor %1203, %1204 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%1206 = torch.aten.tanh %1205 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%1207 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_561 = torch.constant.int 1
%1208 = torch.aten.add.Tensor %1206, %1207, %int1_561 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%1209 = torch.aten.mul.Tensor %1198, %1208 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%1210 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_562 = torch.constant.int 7
%int6400_563 = torch.constant.int 6400
%1211 = torch.prim.ListConstruct %int7_562, %int6400_563 : (!torch.int, !torch.int) -> !torch.list<int>
%1212 = torch.aten.reshape %1209, %1211 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_564 = torch.constant.int 0
%int1_565 = torch.constant.int 1
%1213 = torch.aten.mm %1212, %84 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%1214 = torch.aten.add.Tensor %1213, %85, %int1_565 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%1215 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_566 = torch.constant.int 1
%int7_567 = torch.constant.int 7
%int1600_568 = torch.constant.int 1600
%1216 = torch.prim.ListConstruct %int1_566, %int7_567, %int1600_568 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1217 = torch.aten.reshape %1214, %1216 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_569 = torch.constant.int 1
%1218 = torch.aten.add.Tensor %1187, %1217, %int1_569 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_570 = torch.constant.float 9.9999997473787516E-6
%int1600_571 = torch.constant.int 1600
%1219 = torch.prim.ListConstruct %int1600_571 : (!torch.int) -> !torch.list<int>
%result0_572, %result1_573, %result2_574 = torch.aten.native_layer_norm %1218, %1219, %86, %87, %float9.999990e-06_570 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%1220 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_575 = torch.constant.int 7
%int1600_576 = torch.constant.int 1600
%1221 = torch.prim.ListConstruct %int7_575, %int1600_576 : (!torch.int, !torch.int) -> !torch.list<int>
%1222 = torch.aten.reshape %result0_572, %1221 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_577 = torch.constant.int 0
%int1_578 = torch.constant.int 1
%1223 = torch.aten.mm %1222, %88 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%1224 = torch.aten.add.Tensor %1223, %89, %int1_578 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%1225 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_579 = torch.constant.int 1
%int7_580 = torch.constant.int 7
%int4800_581 = torch.constant.int 4800
%1226 = torch.prim.ListConstruct %int1_579, %int7_580, %int4800_581 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1227 = torch.aten.reshape %1224, %1226 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%1228 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%1229 = torch.prim.tolist(%1228) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2_582 = torch.constant.int 2
%1230 = torch.aten.split_with_sizes %1227, %1229, %int2_582 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%1231:3 = torch.prim.ListUnpack %1230 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%1232 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_583 = torch.constant.int 1
%int7_584 = torch.constant.int 7
%int25_585 = torch.constant.int 25
%int64_586 = torch.constant.int 64
%1233 = torch.prim.ListConstruct %int1_583, %int7_584, %int25_585, %int64_586 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1234 = torch.aten.reshape %1231#0, %1233 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_587 = torch.constant.int 1
%int2_588 = torch.constant.int 2
%1235 = torch.aten.transpose.int %1234, %int1_587, %int2_588 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%1236 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_589 = torch.constant.int 1
%int7_590 = torch.constant.int 7
%int25_591 = torch.constant.int 25
%int64_592 = torch.constant.int 64
%1237 = torch.prim.ListConstruct %int1_589, %int7_590, %int25_591, %int64_592 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1238 = torch.aten.reshape %1231#1, %1237 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_593 = torch.constant.int 1
%int2_594 = torch.constant.int 2
%1239 = torch.aten.transpose.int %1238, %int1_593, %int2_594 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%1240 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_595 = torch.constant.int 1
%int7_596 = torch.constant.int 7
%int25_597 = torch.constant.int 25
%int64_598 = torch.constant.int 64
%1241 = torch.prim.ListConstruct %int1_595, %int7_596, %int25_597, %int64_598 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1242 = torch.aten.reshape %1231#2, %1241 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_599 = torch.constant.int 1
%int2_600 = torch.constant.int 2
%1243 = torch.aten.transpose.int %1242, %int1_599, %int2_600 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_601 = torch.constant.int 1
%int2_602 = torch.constant.int 2
%1244 = torch.aten.transpose.int %1238, %int1_601, %int2_602 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_603 = torch.constant.int 2
%int3_604 = torch.constant.int 3
%1245 = torch.aten.transpose.int %1244, %int2_603, %int3_604 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%1246 = torch.aten.matmul %1235, %1245 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%1247 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%1248 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%1249 = torch.aten.pow.Tensor_Tensor %1247, %1248 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%1250 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_605 = torch.constant.int 0
%1251 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_606 = torch.constant.none
%float0.000000e00_607 = torch.constant.float 0.000000e+00
%1252 = torch.aten.full %1251, %float0.000000e00_607, %none_606, %none_606, %none_606, %none_606 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_608 = torch.constant.int 1
%1253 = torch.aten.add.Tensor %1252, %1249, %int1_608 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%1254 = torch.aten.div.Tensor %1246, %1253 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%1255 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6_609 = torch.constant.int 6
%none_610 = torch.constant.none
%false_611 = torch.constant.bool false
%1256 = torch.aten.to.dtype %1254, %int6_609, %false_611, %false_611, %none_610 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%1257 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%1258 = torch.aten.where.self %1255, %1256, %1257 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_612 = torch.constant.int 3
%none_613 = torch.constant.none
%1259 = torch.aten.softmax.int %1258, %int3_612, %none_613 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_614 = torch.constant.int 6
%none_615 = torch.constant.none
%false_616 = torch.constant.bool false
%1260 = torch.aten.to.dtype %1259, %int6_614, %false_616, %false_616, %none_615 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%1261 = torch.aten.matmul %1260, %1243 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_617 = torch.constant.int 1
%int2_618 = torch.constant.int 2
%1262 = torch.aten.transpose.int %1261, %int1_617, %int2_618 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%1263 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_619 = torch.constant.int 1
%int7_620 = torch.constant.int 7
%int1600_621 = torch.constant.int 1600
%1264 = torch.prim.ListConstruct %int1_619, %int7_620, %int1600_621 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1265 = torch.aten.reshape %1262, %1264 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%1266 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_622 = torch.constant.int 7
%int1600_623 = torch.constant.int 1600
%1267 = torch.prim.ListConstruct %int7_622, %int1600_623 : (!torch.int, !torch.int) -> !torch.list<int>
%1268 = torch.aten.reshape %1265, %1267 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_624 = torch.constant.int 0
%int1_625 = torch.constant.int 1
%1269 = torch.aten.mm %1268, %90 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%1270 = torch.aten.add.Tensor %1269, %91, %int1_625 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%1271 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_626 = torch.constant.int 1
%int7_627 = torch.constant.int 7
%int1600_628 = torch.constant.int 1600
%1272 = torch.prim.ListConstruct %int1_626, %int7_627, %int1600_628 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1273 = torch.aten.reshape %1270, %1272 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_629 = torch.constant.int 1
%1274 = torch.aten.add.Tensor %1273, %1218, %int1_629 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_630 = torch.constant.float 9.9999997473787516E-6
%int1600_631 = torch.constant.int 1600
%1275 = torch.prim.ListConstruct %int1600_631 : (!torch.int) -> !torch.list<int>
%result0_632, %result1_633, %result2_634 = torch.aten.native_layer_norm %1274, %1275, %92, %93, %float9.999990e-06_630 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%1276 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_635 = torch.constant.int 7
%int1600_636 = torch.constant.int 1600
%1277 = torch.prim.ListConstruct %int7_635, %int1600_636 : (!torch.int, !torch.int) -> !torch.list<int>
%1278 = torch.aten.reshape %result0_632, %1277 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_637 = torch.constant.int 0
%int1_638 = torch.constant.int 1
%1279 = torch.aten.mm %1278, %94 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%1280 = torch.aten.add.Tensor %1279, %95, %int1_638 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%1281 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_639 = torch.constant.int 1
%int7_640 = torch.constant.int 7
%int6400_641 = torch.constant.int 6400
%1282 = torch.prim.ListConstruct %int1_639, %int7_640, %int6400_641 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1283 = torch.aten.reshape %1280, %1282 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%1284 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%1285 = torch.aten.mul.Tensor %1283, %1284 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%1286 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%1287 = torch.aten.pow.Tensor_Tensor %1283, %1286 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%1288 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%1289 = torch.aten.mul.Tensor %1287, %1288 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_642 = torch.constant.int 1
%1290 = torch.aten.add.Tensor %1283, %1289, %int1_642 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%1291 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%1292 = torch.aten.mul.Tensor %1290, %1291 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%1293 = torch.aten.tanh %1292 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%1294 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_643 = torch.constant.int 1
%1295 = torch.aten.add.Tensor %1293, %1294, %int1_643 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%1296 = torch.aten.mul.Tensor %1285, %1295 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%1297 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_644 = torch.constant.int 7
%int6400_645 = torch.constant.int 6400
%1298 = torch.prim.ListConstruct %int7_644, %int6400_645 : (!torch.int, !torch.int) -> !torch.list<int>
%1299 = torch.aten.reshape %1296, %1298 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_646 = torch.constant.int 0
%int1_647 = torch.constant.int 1
%1300 = torch.aten.mm %1299, %96 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%1301 = torch.aten.add.Tensor %1300, %97, %int1_647 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%1302 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_648 = torch.constant.int 1
%int7_649 = torch.constant.int 7
%int1600_650 = torch.constant.int 1600
%1303 = torch.prim.ListConstruct %int1_648, %int7_649, %int1600_650 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1304 = torch.aten.reshape %1301, %1303 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_651 = torch.constant.int 1
%1305 = torch.aten.add.Tensor %1274, %1304, %int1_651 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_652 = torch.constant.float 9.9999997473787516E-6
%int1600_653 = torch.constant.int 1600
%1306 = torch.prim.ListConstruct %int1600_653 : (!torch.int) -> !torch.list<int>
%result0_654, %result1_655, %result2_656 = torch.aten.native_layer_norm %1305, %1306, %98, %99, %float9.999990e-06_652 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%1307 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_657 = torch.constant.int 7
%int1600_658 = torch.constant.int 1600
%1308 = torch.prim.ListConstruct %int7_657, %int1600_658 : (!torch.int, !torch.int) -> !torch.list<int>
%1309 = torch.aten.reshape %result0_654, %1308 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_659 = torch.constant.int 0
%int1_660 = torch.constant.int 1
%1310 = torch.aten.mm %1309, %100 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%1311 = torch.aten.add.Tensor %1310, %101, %int1_660 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%1312 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_661 = torch.constant.int 1
%int7_662 = torch.constant.int 7
%int4800_663 = torch.constant.int 4800
%1313 = torch.prim.ListConstruct %int1_661, %int7_662, %int4800_663 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1314 = torch.aten.reshape %1311, %1313 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%1315 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%1316 = torch.prim.tolist(%1315) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2_664 = torch.constant.int 2
%1317 = torch.aten.split_with_sizes %1314, %1316, %int2_664 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%1318:3 = torch.prim.ListUnpack %1317 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%1319 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_665 = torch.constant.int 1
%int7_666 = torch.constant.int 7
%int25_667 = torch.constant.int 25
%int64_668 = torch.constant.int 64
%1320 = torch.prim.ListConstruct %int1_665, %int7_666, %int25_667, %int64_668 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1321 = torch.aten.reshape %1318#0, %1320 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_669 = torch.constant.int 1
%int2_670 = torch.constant.int 2
%1322 = torch.aten.transpose.int %1321, %int1_669, %int2_670 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%1323 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_671 = torch.constant.int 1
%int7_672 = torch.constant.int 7
%int25_673 = torch.constant.int 25
%int64_674 = torch.constant.int 64
%1324 = torch.prim.ListConstruct %int1_671, %int7_672, %int25_673, %int64_674 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1325 = torch.aten.reshape %1318#1, %1324 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_675 = torch.constant.int 1
%int2_676 = torch.constant.int 2
%1326 = torch.aten.transpose.int %1325, %int1_675, %int2_676 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%1327 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_677 = torch.constant.int 1
%int7_678 = torch.constant.int 7
%int25_679 = torch.constant.int 25
%int64_680 = torch.constant.int 64
%1328 = torch.prim.ListConstruct %int1_677, %int7_678, %int25_679, %int64_680 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1329 = torch.aten.reshape %1318#2, %1328 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_681 = torch.constant.int 1
%int2_682 = torch.constant.int 2
%1330 = torch.aten.transpose.int %1329, %int1_681, %int2_682 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_683 = torch.constant.int 1
%int2_684 = torch.constant.int 2
%1331 = torch.aten.transpose.int %1325, %int1_683, %int2_684 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_685 = torch.constant.int 2
%int3_686 = torch.constant.int 3
%1332 = torch.aten.transpose.int %1331, %int2_685, %int3_686 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%1333 = torch.aten.matmul %1322, %1332 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%1334 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%1335 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%1336 = torch.aten.pow.Tensor_Tensor %1334, %1335 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%1337 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_687 = torch.constant.int 0
%1338 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_688 = torch.constant.none
%float0.000000e00_689 = torch.constant.float 0.000000e+00
%1339 = torch.aten.full %1338, %float0.000000e00_689, %none_688, %none_688, %none_688, %none_688 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_690 = torch.constant.int 1
%1340 = torch.aten.add.Tensor %1339, %1336, %int1_690 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%1341 = torch.aten.div.Tensor %1333, %1340 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%1342 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6_691 = torch.constant.int 6
%none_692 = torch.constant.none
%false_693 = torch.constant.bool false
%1343 = torch.aten.to.dtype %1341, %int6_691, %false_693, %false_693, %none_692 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%1344 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%1345 = torch.aten.where.self %1342, %1343, %1344 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_694 = torch.constant.int 3
%none_695 = torch.constant.none
%1346 = torch.aten.softmax.int %1345, %int3_694, %none_695 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_696 = torch.constant.int 6
%none_697 = torch.constant.none
%false_698 = torch.constant.bool false
%1347 = torch.aten.to.dtype %1346, %int6_696, %false_698, %false_698, %none_697 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%1348 = torch.aten.matmul %1347, %1330 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_699 = torch.constant.int 1
%int2_700 = torch.constant.int 2
%1349 = torch.aten.transpose.int %1348, %int1_699, %int2_700 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%1350 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_701 = torch.constant.int 1
%int7_702 = torch.constant.int 7
%int1600_703 = torch.constant.int 1600
%1351 = torch.prim.ListConstruct %int1_701, %int7_702, %int1600_703 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1352 = torch.aten.reshape %1349, %1351 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%1353 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_704 = torch.constant.int 7
%int1600_705 = torch.constant.int 1600
%1354 = torch.prim.ListConstruct %int7_704, %int1600_705 : (!torch.int, !torch.int) -> !torch.list<int>
%1355 = torch.aten.reshape %1352, %1354 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_706 = torch.constant.int 0
%int1_707 = torch.constant.int 1
%1356 = torch.aten.mm %1355, %102 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%1357 = torch.aten.add.Tensor %1356, %103, %int1_707 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%1358 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_708 = torch.constant.int 1
%int7_709 = torch.constant.int 7
%int1600_710 = torch.constant.int 1600
%1359 = torch.prim.ListConstruct %int1_708, %int7_709, %int1600_710 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1360 = torch.aten.reshape %1357, %1359 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_711 = torch.constant.int 1
%1361 = torch.aten.add.Tensor %1360, %1305, %int1_711 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_712 = torch.constant.float 9.9999997473787516E-6
%int1600_713 = torch.constant.int 1600
%1362 = torch.prim.ListConstruct %int1600_713 : (!torch.int) -> !torch.list<int>
%result0_714, %result1_715, %result2_716 = torch.aten.native_layer_norm %1361, %1362, %104, %105, %float9.999990e-06_712 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%1363 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_717 = torch.constant.int 7
%int1600_718 = torch.constant.int 1600
%1364 = torch.prim.ListConstruct %int7_717, %int1600_718 : (!torch.int, !torch.int) -> !torch.list<int>
%1365 = torch.aten.reshape %result0_714, %1364 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_719 = torch.constant.int 0
%int1_720 = torch.constant.int 1
%1366 = torch.aten.mm %1365, %106 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%1367 = torch.aten.add.Tensor %1366, %107, %int1_720 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%1368 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_721 = torch.constant.int 1
%int7_722 = torch.constant.int 7
%int6400_723 = torch.constant.int 6400
%1369 = torch.prim.ListConstruct %int1_721, %int7_722, %int6400_723 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1370 = torch.aten.reshape %1367, %1369 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%1371 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%1372 = torch.aten.mul.Tensor %1370, %1371 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%1373 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%1374 = torch.aten.pow.Tensor_Tensor %1370, %1373 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%1375 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%1376 = torch.aten.mul.Tensor %1374, %1375 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_724 = torch.constant.int 1
%1377 = torch.aten.add.Tensor %1370, %1376, %int1_724 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%1378 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%1379 = torch.aten.mul.Tensor %1377, %1378 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%1380 = torch.aten.tanh %1379 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%1381 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_725 = torch.constant.int 1
%1382 = torch.aten.add.Tensor %1380, %1381, %int1_725 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%1383 = torch.aten.mul.Tensor %1372, %1382 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%1384 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_726 = torch.constant.int 7
%int6400_727 = torch.constant.int 6400
%1385 = torch.prim.ListConstruct %int7_726, %int6400_727 : (!torch.int, !torch.int) -> !torch.list<int>
%1386 = torch.aten.reshape %1383, %1385 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_728 = torch.constant.int 0
%int1_729 = torch.constant.int 1
%1387 = torch.aten.mm %1386, %108 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%1388 = torch.aten.add.Tensor %1387, %109, %int1_729 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%1389 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_730 = torch.constant.int 1
%int7_731 = torch.constant.int 7
%int1600_732 = torch.constant.int 1600
%1390 = torch.prim.ListConstruct %int1_730, %int7_731, %int1600_732 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1391 = torch.aten.reshape %1388, %1390 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_733 = torch.constant.int 1
%1392 = torch.aten.add.Tensor %1361, %1391, %int1_733 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_734 = torch.constant.float 9.9999997473787516E-6
%int1600_735 = torch.constant.int 1600
%1393 = torch.prim.ListConstruct %int1600_735 : (!torch.int) -> !torch.list<int>
%result0_736, %result1_737, %result2_738 = torch.aten.native_layer_norm %1392, %1393, %110, %111, %float9.999990e-06_734 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%1394 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_739 = torch.constant.int 7
%int1600_740 = torch.constant.int 1600
%1395 = torch.prim.ListConstruct %int7_739, %int1600_740 : (!torch.int, !torch.int) -> !torch.list<int>
%1396 = torch.aten.reshape %result0_736, %1395 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_741 = torch.constant.int 0
%int1_742 = torch.constant.int 1
%1397 = torch.aten.mm %1396, %112 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%1398 = torch.aten.add.Tensor %1397, %113, %int1_742 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%1399 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_743 = torch.constant.int 1
%int7_744 = torch.constant.int 7
%int4800_745 = torch.constant.int 4800
%1400 = torch.prim.ListConstruct %int1_743, %int7_744, %int4800_745 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1401 = torch.aten.reshape %1398, %1400 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%1402 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%1403 = torch.prim.tolist(%1402) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2_746 = torch.constant.int 2
%1404 = torch.aten.split_with_sizes %1401, %1403, %int2_746 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%1405:3 = torch.prim.ListUnpack %1404 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%1406 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_747 = torch.constant.int 1
%int7_748 = torch.constant.int 7
%int25_749 = torch.constant.int 25
%int64_750 = torch.constant.int 64
%1407 = torch.prim.ListConstruct %int1_747, %int7_748, %int25_749, %int64_750 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1408 = torch.aten.reshape %1405#0, %1407 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_751 = torch.constant.int 1
%int2_752 = torch.constant.int 2
%1409 = torch.aten.transpose.int %1408, %int1_751, %int2_752 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%1410 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_753 = torch.constant.int 1
%int7_754 = torch.constant.int 7
%int25_755 = torch.constant.int 25
%int64_756 = torch.constant.int 64
%1411 = torch.prim.ListConstruct %int1_753, %int7_754, %int25_755, %int64_756 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1412 = torch.aten.reshape %1405#1, %1411 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_757 = torch.constant.int 1
%int2_758 = torch.constant.int 2
%1413 = torch.aten.transpose.int %1412, %int1_757, %int2_758 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%1414 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_759 = torch.constant.int 1
%int7_760 = torch.constant.int 7
%int25_761 = torch.constant.int 25
%int64_762 = torch.constant.int 64
%1415 = torch.prim.ListConstruct %int1_759, %int7_760, %int25_761, %int64_762 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1416 = torch.aten.reshape %1405#2, %1415 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_763 = torch.constant.int 1
%int2_764 = torch.constant.int 2
%1417 = torch.aten.transpose.int %1416, %int1_763, %int2_764 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_765 = torch.constant.int 1
%int2_766 = torch.constant.int 2
%1418 = torch.aten.transpose.int %1412, %int1_765, %int2_766 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_767 = torch.constant.int 2
%int3_768 = torch.constant.int 3
%1419 = torch.aten.transpose.int %1418, %int2_767, %int3_768 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%1420 = torch.aten.matmul %1409, %1419 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%1421 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%1422 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%1423 = torch.aten.pow.Tensor_Tensor %1421, %1422 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%1424 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_769 = torch.constant.int 0
%1425 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_770 = torch.constant.none
%float0.000000e00_771 = torch.constant.float 0.000000e+00
%1426 = torch.aten.full %1425, %float0.000000e00_771, %none_770, %none_770, %none_770, %none_770 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_772 = torch.constant.int 1
%1427 = torch.aten.add.Tensor %1426, %1423, %int1_772 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%1428 = torch.aten.div.Tensor %1420, %1427 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%1429 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6_773 = torch.constant.int 6
%none_774 = torch.constant.none
%false_775 = torch.constant.bool false
%1430 = torch.aten.to.dtype %1428, %int6_773, %false_775, %false_775, %none_774 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%1431 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%1432 = torch.aten.where.self %1429, %1430, %1431 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_776 = torch.constant.int 3
%none_777 = torch.constant.none
%1433 = torch.aten.softmax.int %1432, %int3_776, %none_777 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_778 = torch.constant.int 6
%none_779 = torch.constant.none
%false_780 = torch.constant.bool false
%1434 = torch.aten.to.dtype %1433, %int6_778, %false_780, %false_780, %none_779 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%1435 = torch.aten.matmul %1434, %1417 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_781 = torch.constant.int 1
%int2_782 = torch.constant.int 2
%1436 = torch.aten.transpose.int %1435, %int1_781, %int2_782 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%1437 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_783 = torch.constant.int 1
%int7_784 = torch.constant.int 7
%int1600_785 = torch.constant.int 1600
%1438 = torch.prim.ListConstruct %int1_783, %int7_784, %int1600_785 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1439 = torch.aten.reshape %1436, %1438 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%1440 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_786 = torch.constant.int 7
%int1600_787 = torch.constant.int 1600
%1441 = torch.prim.ListConstruct %int7_786, %int1600_787 : (!torch.int, !torch.int) -> !torch.list<int>
%1442 = torch.aten.reshape %1439, %1441 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_788 = torch.constant.int 0
%int1_789 = torch.constant.int 1
%1443 = torch.aten.mm %1442, %114 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%1444 = torch.aten.add.Tensor %1443, %115, %int1_789 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%1445 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_790 = torch.constant.int 1
%int7_791 = torch.constant.int 7
%int1600_792 = torch.constant.int 1600
%1446 = torch.prim.ListConstruct %int1_790, %int7_791, %int1600_792 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1447 = torch.aten.reshape %1444, %1446 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_793 = torch.constant.int 1
%1448 = torch.aten.add.Tensor %1447, %1392, %int1_793 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_794 = torch.constant.float 9.9999997473787516E-6
%int1600_795 = torch.constant.int 1600
%1449 = torch.prim.ListConstruct %int1600_795 : (!torch.int) -> !torch.list<int>
%result0_796, %result1_797, %result2_798 = torch.aten.native_layer_norm %1448, %1449, %116, %117, %float9.999990e-06_794 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%1450 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_799 = torch.constant.int 7
%int1600_800 = torch.constant.int 1600
%1451 = torch.prim.ListConstruct %int7_799, %int1600_800 : (!torch.int, !torch.int) -> !torch.list<int>
%1452 = torch.aten.reshape %result0_796, %1451 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_801 = torch.constant.int 0
%int1_802 = torch.constant.int 1
%1453 = torch.aten.mm %1452, %118 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%1454 = torch.aten.add.Tensor %1453, %119, %int1_802 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%1455 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_803 = torch.constant.int 1
%int7_804 = torch.constant.int 7
%int6400_805 = torch.constant.int 6400
%1456 = torch.prim.ListConstruct %int1_803, %int7_804, %int6400_805 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1457 = torch.aten.reshape %1454, %1456 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%1458 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%1459 = torch.aten.mul.Tensor %1457, %1458 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%1460 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%1461 = torch.aten.pow.Tensor_Tensor %1457, %1460 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%1462 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%1463 = torch.aten.mul.Tensor %1461, %1462 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_806 = torch.constant.int 1
%1464 = torch.aten.add.Tensor %1457, %1463, %int1_806 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%1465 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%1466 = torch.aten.mul.Tensor %1464, %1465 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%1467 = torch.aten.tanh %1466 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%1468 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_807 = torch.constant.int 1
%1469 = torch.aten.add.Tensor %1467, %1468, %int1_807 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%1470 = torch.aten.mul.Tensor %1459, %1469 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%1471 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_808 = torch.constant.int 7
%int6400_809 = torch.constant.int 6400
%1472 = torch.prim.ListConstruct %int7_808, %int6400_809 : (!torch.int, !torch.int) -> !torch.list<int>
%1473 = torch.aten.reshape %1470, %1472 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_810 = torch.constant.int 0
%int1_811 = torch.constant.int 1
%1474 = torch.aten.mm %1473, %120 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%1475 = torch.aten.add.Tensor %1474, %121, %int1_811 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%1476 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_812 = torch.constant.int 1
%int7_813 = torch.constant.int 7
%int1600_814 = torch.constant.int 1600
%1477 = torch.prim.ListConstruct %int1_812, %int7_813, %int1600_814 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1478 = torch.aten.reshape %1475, %1477 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_815 = torch.constant.int 1
%1479 = torch.aten.add.Tensor %1448, %1478, %int1_815 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_816 = torch.constant.float 9.9999997473787516E-6
%int1600_817 = torch.constant.int 1600
%1480 = torch.prim.ListConstruct %int1600_817 : (!torch.int) -> !torch.list<int>
%result0_818, %result1_819, %result2_820 = torch.aten.native_layer_norm %1479, %1480, %122, %123, %float9.999990e-06_816 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%1481 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_821 = torch.constant.int 7
%int1600_822 = torch.constant.int 1600
%1482 = torch.prim.ListConstruct %int7_821, %int1600_822 : (!torch.int, !torch.int) -> !torch.list<int>
%1483 = torch.aten.reshape %result0_818, %1482 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_823 = torch.constant.int 0
%int1_824 = torch.constant.int 1
%1484 = torch.aten.mm %1483, %124 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%1485 = torch.aten.add.Tensor %1484, %125, %int1_824 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%1486 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_825 = torch.constant.int 1
%int7_826 = torch.constant.int 7
%int4800_827 = torch.constant.int 4800
%1487 = torch.prim.ListConstruct %int1_825, %int7_826, %int4800_827 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1488 = torch.aten.reshape %1485, %1487 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%1489 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%1490 = torch.prim.tolist(%1489) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2_828 = torch.constant.int 2
%1491 = torch.aten.split_with_sizes %1488, %1490, %int2_828 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%1492:3 = torch.prim.ListUnpack %1491 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%1493 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_829 = torch.constant.int 1
%int7_830 = torch.constant.int 7
%int25_831 = torch.constant.int 25
%int64_832 = torch.constant.int 64
%1494 = torch.prim.ListConstruct %int1_829, %int7_830, %int25_831, %int64_832 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1495 = torch.aten.reshape %1492#0, %1494 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_833 = torch.constant.int 1
%int2_834 = torch.constant.int 2
%1496 = torch.aten.transpose.int %1495, %int1_833, %int2_834 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%1497 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_835 = torch.constant.int 1
%int7_836 = torch.constant.int 7
%int25_837 = torch.constant.int 25
%int64_838 = torch.constant.int 64
%1498 = torch.prim.ListConstruct %int1_835, %int7_836, %int25_837, %int64_838 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1499 = torch.aten.reshape %1492#1, %1498 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_839 = torch.constant.int 1
%int2_840 = torch.constant.int 2
%1500 = torch.aten.transpose.int %1499, %int1_839, %int2_840 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%1501 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_841 = torch.constant.int 1
%int7_842 = torch.constant.int 7
%int25_843 = torch.constant.int 25
%int64_844 = torch.constant.int 64
%1502 = torch.prim.ListConstruct %int1_841, %int7_842, %int25_843, %int64_844 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1503 = torch.aten.reshape %1492#2, %1502 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_845 = torch.constant.int 1
%int2_846 = torch.constant.int 2
%1504 = torch.aten.transpose.int %1503, %int1_845, %int2_846 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_847 = torch.constant.int 1
%int2_848 = torch.constant.int 2
%1505 = torch.aten.transpose.int %1499, %int1_847, %int2_848 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_849 = torch.constant.int 2
%int3_850 = torch.constant.int 3
%1506 = torch.aten.transpose.int %1505, %int2_849, %int3_850 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%1507 = torch.aten.matmul %1496, %1506 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%1508 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%1509 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%1510 = torch.aten.pow.Tensor_Tensor %1508, %1509 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%1511 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_851 = torch.constant.int 0
%1512 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_852 = torch.constant.none
%float0.000000e00_853 = torch.constant.float 0.000000e+00
%1513 = torch.aten.full %1512, %float0.000000e00_853, %none_852, %none_852, %none_852, %none_852 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_854 = torch.constant.int 1
%1514 = torch.aten.add.Tensor %1513, %1510, %int1_854 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%1515 = torch.aten.div.Tensor %1507, %1514 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%1516 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6_855 = torch.constant.int 6
%none_856 = torch.constant.none
%false_857 = torch.constant.bool false
%1517 = torch.aten.to.dtype %1515, %int6_855, %false_857, %false_857, %none_856 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%1518 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%1519 = torch.aten.where.self %1516, %1517, %1518 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_858 = torch.constant.int 3
%none_859 = torch.constant.none
%1520 = torch.aten.softmax.int %1519, %int3_858, %none_859 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_860 = torch.constant.int 6
%none_861 = torch.constant.none
%false_862 = torch.constant.bool false
%1521 = torch.aten.to.dtype %1520, %int6_860, %false_862, %false_862, %none_861 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%1522 = torch.aten.matmul %1521, %1504 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_863 = torch.constant.int 1
%int2_864 = torch.constant.int 2
%1523 = torch.aten.transpose.int %1522, %int1_863, %int2_864 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%1524 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_865 = torch.constant.int 1
%int7_866 = torch.constant.int 7
%int1600_867 = torch.constant.int 1600
%1525 = torch.prim.ListConstruct %int1_865, %int7_866, %int1600_867 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1526 = torch.aten.reshape %1523, %1525 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%1527 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_868 = torch.constant.int 7
%int1600_869 = torch.constant.int 1600
%1528 = torch.prim.ListConstruct %int7_868, %int1600_869 : (!torch.int, !torch.int) -> !torch.list<int>
%1529 = torch.aten.reshape %1526, %1528 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_870 = torch.constant.int 0
%int1_871 = torch.constant.int 1
%1530 = torch.aten.mm %1529, %126 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%1531 = torch.aten.add.Tensor %1530, %127, %int1_871 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%1532 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_872 = torch.constant.int 1
%int7_873 = torch.constant.int 7
%int1600_874 = torch.constant.int 1600
%1533 = torch.prim.ListConstruct %int1_872, %int7_873, %int1600_874 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1534 = torch.aten.reshape %1531, %1533 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_875 = torch.constant.int 1
%1535 = torch.aten.add.Tensor %1534, %1479, %int1_875 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_876 = torch.constant.float 9.9999997473787516E-6
%int1600_877 = torch.constant.int 1600
%1536 = torch.prim.ListConstruct %int1600_877 : (!torch.int) -> !torch.list<int>
%result0_878, %result1_879, %result2_880 = torch.aten.native_layer_norm %1535, %1536, %128, %129, %float9.999990e-06_876 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%1537 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_881 = torch.constant.int 7
%int1600_882 = torch.constant.int 1600
%1538 = torch.prim.ListConstruct %int7_881, %int1600_882 : (!torch.int, !torch.int) -> !torch.list<int>
%1539 = torch.aten.reshape %result0_878, %1538 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_883 = torch.constant.int 0
%int1_884 = torch.constant.int 1
%1540 = torch.aten.mm %1539, %130 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%1541 = torch.aten.add.Tensor %1540, %131, %int1_884 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%1542 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_885 = torch.constant.int 1
%int7_886 = torch.constant.int 7
%int6400_887 = torch.constant.int 6400
%1543 = torch.prim.ListConstruct %int1_885, %int7_886, %int6400_887 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1544 = torch.aten.reshape %1541, %1543 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%1545 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%1546 = torch.aten.mul.Tensor %1544, %1545 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%1547 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%1548 = torch.aten.pow.Tensor_Tensor %1544, %1547 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%1549 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%1550 = torch.aten.mul.Tensor %1548, %1549 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_888 = torch.constant.int 1
%1551 = torch.aten.add.Tensor %1544, %1550, %int1_888 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%1552 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%1553 = torch.aten.mul.Tensor %1551, %1552 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%1554 = torch.aten.tanh %1553 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%1555 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_889 = torch.constant.int 1
%1556 = torch.aten.add.Tensor %1554, %1555, %int1_889 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%1557 = torch.aten.mul.Tensor %1546, %1556 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%1558 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_890 = torch.constant.int 7
%int6400_891 = torch.constant.int 6400
%1559 = torch.prim.ListConstruct %int7_890, %int6400_891 : (!torch.int, !torch.int) -> !torch.list<int>
%1560 = torch.aten.reshape %1557, %1559 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_892 = torch.constant.int 0
%int1_893 = torch.constant.int 1
%1561 = torch.aten.mm %1560, %132 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%1562 = torch.aten.add.Tensor %1561, %133, %int1_893 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%1563 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_894 = torch.constant.int 1
%int7_895 = torch.constant.int 7
%int1600_896 = torch.constant.int 1600
%1564 = torch.prim.ListConstruct %int1_894, %int7_895, %int1600_896 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1565 = torch.aten.reshape %1562, %1564 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_897 = torch.constant.int 1
%1566 = torch.aten.add.Tensor %1535, %1565, %int1_897 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_898 = torch.constant.float 9.9999997473787516E-6
%int1600_899 = torch.constant.int 1600
%1567 = torch.prim.ListConstruct %int1600_899 : (!torch.int) -> !torch.list<int>
%result0_900, %result1_901, %result2_902 = torch.aten.native_layer_norm %1566, %1567, %134, %135, %float9.999990e-06_898 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%1568 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_903 = torch.constant.int 7
%int1600_904 = torch.constant.int 1600
%1569 = torch.prim.ListConstruct %int7_903, %int1600_904 : (!torch.int, !torch.int) -> !torch.list<int>
%1570 = torch.aten.reshape %result0_900, %1569 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_905 = torch.constant.int 0
%int1_906 = torch.constant.int 1
%1571 = torch.aten.mm %1570, %136 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%1572 = torch.aten.add.Tensor %1571, %137, %int1_906 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%1573 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_907 = torch.constant.int 1
%int7_908 = torch.constant.int 7
%int4800_909 = torch.constant.int 4800
%1574 = torch.prim.ListConstruct %int1_907, %int7_908, %int4800_909 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1575 = torch.aten.reshape %1572, %1574 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%1576 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%1577 = torch.prim.tolist(%1576) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2_910 = torch.constant.int 2
%1578 = torch.aten.split_with_sizes %1575, %1577, %int2_910 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%1579:3 = torch.prim.ListUnpack %1578 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%1580 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_911 = torch.constant.int 1
%int7_912 = torch.constant.int 7
%int25_913 = torch.constant.int 25
%int64_914 = torch.constant.int 64
%1581 = torch.prim.ListConstruct %int1_911, %int7_912, %int25_913, %int64_914 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1582 = torch.aten.reshape %1579#0, %1581 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_915 = torch.constant.int 1
%int2_916 = torch.constant.int 2
%1583 = torch.aten.transpose.int %1582, %int1_915, %int2_916 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%1584 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_917 = torch.constant.int 1
%int7_918 = torch.constant.int 7
%int25_919 = torch.constant.int 25
%int64_920 = torch.constant.int 64
%1585 = torch.prim.ListConstruct %int1_917, %int7_918, %int25_919, %int64_920 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1586 = torch.aten.reshape %1579#1, %1585 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_921 = torch.constant.int 1
%int2_922 = torch.constant.int 2
%1587 = torch.aten.transpose.int %1586, %int1_921, %int2_922 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%1588 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_923 = torch.constant.int 1
%int7_924 = torch.constant.int 7
%int25_925 = torch.constant.int 25
%int64_926 = torch.constant.int 64
%1589 = torch.prim.ListConstruct %int1_923, %int7_924, %int25_925, %int64_926 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1590 = torch.aten.reshape %1579#2, %1589 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_927 = torch.constant.int 1
%int2_928 = torch.constant.int 2
%1591 = torch.aten.transpose.int %1590, %int1_927, %int2_928 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_929 = torch.constant.int 1
%int2_930 = torch.constant.int 2
%1592 = torch.aten.transpose.int %1586, %int1_929, %int2_930 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_931 = torch.constant.int 2
%int3_932 = torch.constant.int 3
%1593 = torch.aten.transpose.int %1592, %int2_931, %int3_932 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%1594 = torch.aten.matmul %1583, %1593 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%1595 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%1596 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%1597 = torch.aten.pow.Tensor_Tensor %1595, %1596 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%1598 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_933 = torch.constant.int 0
%1599 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_934 = torch.constant.none
%float0.000000e00_935 = torch.constant.float 0.000000e+00
%1600 = torch.aten.full %1599, %float0.000000e00_935, %none_934, %none_934, %none_934, %none_934 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_936 = torch.constant.int 1
%1601 = torch.aten.add.Tensor %1600, %1597, %int1_936 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%1602 = torch.aten.div.Tensor %1594, %1601 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%1603 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6_937 = torch.constant.int 6
%none_938 = torch.constant.none
%false_939 = torch.constant.bool false
%1604 = torch.aten.to.dtype %1602, %int6_937, %false_939, %false_939, %none_938 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%1605 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%1606 = torch.aten.where.self %1603, %1604, %1605 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_940 = torch.constant.int 3
%none_941 = torch.constant.none
%1607 = torch.aten.softmax.int %1606, %int3_940, %none_941 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_942 = torch.constant.int 6
%none_943 = torch.constant.none
%false_944 = torch.constant.bool false
%1608 = torch.aten.to.dtype %1607, %int6_942, %false_944, %false_944, %none_943 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%1609 = torch.aten.matmul %1608, %1591 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_945 = torch.constant.int 1
%int2_946 = torch.constant.int 2
%1610 = torch.aten.transpose.int %1609, %int1_945, %int2_946 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%1611 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_947 = torch.constant.int 1
%int7_948 = torch.constant.int 7
%int1600_949 = torch.constant.int 1600
%1612 = torch.prim.ListConstruct %int1_947, %int7_948, %int1600_949 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1613 = torch.aten.reshape %1610, %1612 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%1614 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_950 = torch.constant.int 7
%int1600_951 = torch.constant.int 1600
%1615 = torch.prim.ListConstruct %int7_950, %int1600_951 : (!torch.int, !torch.int) -> !torch.list<int>
%1616 = torch.aten.reshape %1613, %1615 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_952 = torch.constant.int 0
%int1_953 = torch.constant.int 1
%1617 = torch.aten.mm %1616, %138 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%1618 = torch.aten.add.Tensor %1617, %139, %int1_953 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%1619 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_954 = torch.constant.int 1
%int7_955 = torch.constant.int 7
%int1600_956 = torch.constant.int 1600
%1620 = torch.prim.ListConstruct %int1_954, %int7_955, %int1600_956 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1621 = torch.aten.reshape %1618, %1620 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_957 = torch.constant.int 1
%1622 = torch.aten.add.Tensor %1621, %1566, %int1_957 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_958 = torch.constant.float 9.9999997473787516E-6
%int1600_959 = torch.constant.int 1600
%1623 = torch.prim.ListConstruct %int1600_959 : (!torch.int) -> !torch.list<int>
%result0_960, %result1_961, %result2_962 = torch.aten.native_layer_norm %1622, %1623, %140, %141, %float9.999990e-06_958 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%1624 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_963 = torch.constant.int 7
%int1600_964 = torch.constant.int 1600
%1625 = torch.prim.ListConstruct %int7_963, %int1600_964 : (!torch.int, !torch.int) -> !torch.list<int>
%1626 = torch.aten.reshape %result0_960, %1625 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_965 = torch.constant.int 0
%int1_966 = torch.constant.int 1
%1627 = torch.aten.mm %1626, %142 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%1628 = torch.aten.add.Tensor %1627, %143, %int1_966 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%1629 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_967 = torch.constant.int 1
%int7_968 = torch.constant.int 7
%int6400_969 = torch.constant.int 6400
%1630 = torch.prim.ListConstruct %int1_967, %int7_968, %int6400_969 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1631 = torch.aten.reshape %1628, %1630 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%1632 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%1633 = torch.aten.mul.Tensor %1631, %1632 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%1634 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%1635 = torch.aten.pow.Tensor_Tensor %1631, %1634 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%1636 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%1637 = torch.aten.mul.Tensor %1635, %1636 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_970 = torch.constant.int 1
%1638 = torch.aten.add.Tensor %1631, %1637, %int1_970 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%1639 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%1640 = torch.aten.mul.Tensor %1638, %1639 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%1641 = torch.aten.tanh %1640 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%1642 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_971 = torch.constant.int 1
%1643 = torch.aten.add.Tensor %1641, %1642, %int1_971 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%1644 = torch.aten.mul.Tensor %1633, %1643 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%1645 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_972 = torch.constant.int 7
%int6400_973 = torch.constant.int 6400
%1646 = torch.prim.ListConstruct %int7_972, %int6400_973 : (!torch.int, !torch.int) -> !torch.list<int>
%1647 = torch.aten.reshape %1644, %1646 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_974 = torch.constant.int 0
%int1_975 = torch.constant.int 1
%1648 = torch.aten.mm %1647, %144 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%1649 = torch.aten.add.Tensor %1648, %145, %int1_975 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%1650 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_976 = torch.constant.int 1
%int7_977 = torch.constant.int 7
%int1600_978 = torch.constant.int 1600
%1651 = torch.prim.ListConstruct %int1_976, %int7_977, %int1600_978 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1652 = torch.aten.reshape %1649, %1651 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_979 = torch.constant.int 1
%1653 = torch.aten.add.Tensor %1622, %1652, %int1_979 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_980 = torch.constant.float 9.9999997473787516E-6
%int1600_981 = torch.constant.int 1600
%1654 = torch.prim.ListConstruct %int1600_981 : (!torch.int) -> !torch.list<int>
%result0_982, %result1_983, %result2_984 = torch.aten.native_layer_norm %1653, %1654, %146, %147, %float9.999990e-06_980 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%1655 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_985 = torch.constant.int 7
%int1600_986 = torch.constant.int 1600
%1656 = torch.prim.ListConstruct %int7_985, %int1600_986 : (!torch.int, !torch.int) -> !torch.list<int>
%1657 = torch.aten.reshape %result0_982, %1656 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_987 = torch.constant.int 0
%int1_988 = torch.constant.int 1
%1658 = torch.aten.mm %1657, %148 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%1659 = torch.aten.add.Tensor %1658, %149, %int1_988 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%1660 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_989 = torch.constant.int 1
%int7_990 = torch.constant.int 7
%int4800_991 = torch.constant.int 4800
%1661 = torch.prim.ListConstruct %int1_989, %int7_990, %int4800_991 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1662 = torch.aten.reshape %1659, %1661 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%1663 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%1664 = torch.prim.tolist(%1663) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2_992 = torch.constant.int 2
%1665 = torch.aten.split_with_sizes %1662, %1664, %int2_992 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%1666:3 = torch.prim.ListUnpack %1665 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%1667 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_993 = torch.constant.int 1
%int7_994 = torch.constant.int 7
%int25_995 = torch.constant.int 25
%int64_996 = torch.constant.int 64
%1668 = torch.prim.ListConstruct %int1_993, %int7_994, %int25_995, %int64_996 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1669 = torch.aten.reshape %1666#0, %1668 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_997 = torch.constant.int 1
%int2_998 = torch.constant.int 2
%1670 = torch.aten.transpose.int %1669, %int1_997, %int2_998 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%1671 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_999 = torch.constant.int 1
%int7_1000 = torch.constant.int 7
%int25_1001 = torch.constant.int 25
%int64_1002 = torch.constant.int 64
%1672 = torch.prim.ListConstruct %int1_999, %int7_1000, %int25_1001, %int64_1002 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1673 = torch.aten.reshape %1666#1, %1672 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_1003 = torch.constant.int 1
%int2_1004 = torch.constant.int 2
%1674 = torch.aten.transpose.int %1673, %int1_1003, %int2_1004 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%1675 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_1005 = torch.constant.int 1
%int7_1006 = torch.constant.int 7
%int25_1007 = torch.constant.int 25
%int64_1008 = torch.constant.int 64
%1676 = torch.prim.ListConstruct %int1_1005, %int7_1006, %int25_1007, %int64_1008 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1677 = torch.aten.reshape %1666#2, %1676 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_1009 = torch.constant.int 1
%int2_1010 = torch.constant.int 2
%1678 = torch.aten.transpose.int %1677, %int1_1009, %int2_1010 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_1011 = torch.constant.int 1
%int2_1012 = torch.constant.int 2
%1679 = torch.aten.transpose.int %1673, %int1_1011, %int2_1012 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_1013 = torch.constant.int 2
%int3_1014 = torch.constant.int 3
%1680 = torch.aten.transpose.int %1679, %int2_1013, %int3_1014 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%1681 = torch.aten.matmul %1670, %1680 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%1682 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%1683 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%1684 = torch.aten.pow.Tensor_Tensor %1682, %1683 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%1685 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_1015 = torch.constant.int 0
%1686 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_1016 = torch.constant.none
%float0.000000e00_1017 = torch.constant.float 0.000000e+00
%1687 = torch.aten.full %1686, %float0.000000e00_1017, %none_1016, %none_1016, %none_1016, %none_1016 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_1018 = torch.constant.int 1
%1688 = torch.aten.add.Tensor %1687, %1684, %int1_1018 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%1689 = torch.aten.div.Tensor %1681, %1688 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%1690 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6_1019 = torch.constant.int 6
%none_1020 = torch.constant.none
%false_1021 = torch.constant.bool false
%1691 = torch.aten.to.dtype %1689, %int6_1019, %false_1021, %false_1021, %none_1020 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%1692 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%1693 = torch.aten.where.self %1690, %1691, %1692 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_1022 = torch.constant.int 3
%none_1023 = torch.constant.none
%1694 = torch.aten.softmax.int %1693, %int3_1022, %none_1023 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_1024 = torch.constant.int 6
%none_1025 = torch.constant.none
%false_1026 = torch.constant.bool false
%1695 = torch.aten.to.dtype %1694, %int6_1024, %false_1026, %false_1026, %none_1025 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%1696 = torch.aten.matmul %1695, %1678 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_1027 = torch.constant.int 1
%int2_1028 = torch.constant.int 2
%1697 = torch.aten.transpose.int %1696, %int1_1027, %int2_1028 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%1698 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1029 = torch.constant.int 1
%int7_1030 = torch.constant.int 7
%int1600_1031 = torch.constant.int 1600
%1699 = torch.prim.ListConstruct %int1_1029, %int7_1030, %int1600_1031 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1700 = torch.aten.reshape %1697, %1699 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%1701 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1032 = torch.constant.int 7
%int1600_1033 = torch.constant.int 1600
%1702 = torch.prim.ListConstruct %int7_1032, %int1600_1033 : (!torch.int, !torch.int) -> !torch.list<int>
%1703 = torch.aten.reshape %1700, %1702 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_1034 = torch.constant.int 0
%int1_1035 = torch.constant.int 1
%1704 = torch.aten.mm %1703, %150 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%1705 = torch.aten.add.Tensor %1704, %151, %int1_1035 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%1706 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1036 = torch.constant.int 1
%int7_1037 = torch.constant.int 7
%int1600_1038 = torch.constant.int 1600
%1707 = torch.prim.ListConstruct %int1_1036, %int7_1037, %int1600_1038 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1708 = torch.aten.reshape %1705, %1707 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_1039 = torch.constant.int 1
%1709 = torch.aten.add.Tensor %1708, %1653, %int1_1039 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_1040 = torch.constant.float 9.9999997473787516E-6
%int1600_1041 = torch.constant.int 1600
%1710 = torch.prim.ListConstruct %int1600_1041 : (!torch.int) -> !torch.list<int>
%result0_1042, %result1_1043, %result2_1044 = torch.aten.native_layer_norm %1709, %1710, %152, %153, %float9.999990e-06_1040 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%1711 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1045 = torch.constant.int 7
%int1600_1046 = torch.constant.int 1600
%1712 = torch.prim.ListConstruct %int7_1045, %int1600_1046 : (!torch.int, !torch.int) -> !torch.list<int>
%1713 = torch.aten.reshape %result0_1042, %1712 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_1047 = torch.constant.int 0
%int1_1048 = torch.constant.int 1
%1714 = torch.aten.mm %1713, %154 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%1715 = torch.aten.add.Tensor %1714, %155, %int1_1048 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%1716 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1049 = torch.constant.int 1
%int7_1050 = torch.constant.int 7
%int6400_1051 = torch.constant.int 6400
%1717 = torch.prim.ListConstruct %int1_1049, %int7_1050, %int6400_1051 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1718 = torch.aten.reshape %1715, %1717 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%1719 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%1720 = torch.aten.mul.Tensor %1718, %1719 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%1721 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%1722 = torch.aten.pow.Tensor_Tensor %1718, %1721 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%1723 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%1724 = torch.aten.mul.Tensor %1722, %1723 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_1052 = torch.constant.int 1
%1725 = torch.aten.add.Tensor %1718, %1724, %int1_1052 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%1726 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%1727 = torch.aten.mul.Tensor %1725, %1726 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%1728 = torch.aten.tanh %1727 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%1729 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_1053 = torch.constant.int 1
%1730 = torch.aten.add.Tensor %1728, %1729, %int1_1053 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%1731 = torch.aten.mul.Tensor %1720, %1730 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%1732 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1054 = torch.constant.int 7
%int6400_1055 = torch.constant.int 6400
%1733 = torch.prim.ListConstruct %int7_1054, %int6400_1055 : (!torch.int, !torch.int) -> !torch.list<int>
%1734 = torch.aten.reshape %1731, %1733 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_1056 = torch.constant.int 0
%int1_1057 = torch.constant.int 1
%1735 = torch.aten.mm %1734, %156 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%1736 = torch.aten.add.Tensor %1735, %157, %int1_1057 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%1737 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1058 = torch.constant.int 1
%int7_1059 = torch.constant.int 7
%int1600_1060 = torch.constant.int 1600
%1738 = torch.prim.ListConstruct %int1_1058, %int7_1059, %int1600_1060 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1739 = torch.aten.reshape %1736, %1738 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_1061 = torch.constant.int 1
%1740 = torch.aten.add.Tensor %1709, %1739, %int1_1061 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_1062 = torch.constant.float 9.9999997473787516E-6
%int1600_1063 = torch.constant.int 1600
%1741 = torch.prim.ListConstruct %int1600_1063 : (!torch.int) -> !torch.list<int>
%result0_1064, %result1_1065, %result2_1066 = torch.aten.native_layer_norm %1740, %1741, %158, %159, %float9.999990e-06_1062 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%1742 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1067 = torch.constant.int 7
%int1600_1068 = torch.constant.int 1600
%1743 = torch.prim.ListConstruct %int7_1067, %int1600_1068 : (!torch.int, !torch.int) -> !torch.list<int>
%1744 = torch.aten.reshape %result0_1064, %1743 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_1069 = torch.constant.int 0
%int1_1070 = torch.constant.int 1
%1745 = torch.aten.mm %1744, %160 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%1746 = torch.aten.add.Tensor %1745, %161, %int1_1070 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%1747 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1071 = torch.constant.int 1
%int7_1072 = torch.constant.int 7
%int4800_1073 = torch.constant.int 4800
%1748 = torch.prim.ListConstruct %int1_1071, %int7_1072, %int4800_1073 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1749 = torch.aten.reshape %1746, %1748 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%1750 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%1751 = torch.prim.tolist(%1750) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2_1074 = torch.constant.int 2
%1752 = torch.aten.split_with_sizes %1749, %1751, %int2_1074 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%1753:3 = torch.prim.ListUnpack %1752 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%1754 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_1075 = torch.constant.int 1
%int7_1076 = torch.constant.int 7
%int25_1077 = torch.constant.int 25
%int64_1078 = torch.constant.int 64
%1755 = torch.prim.ListConstruct %int1_1075, %int7_1076, %int25_1077, %int64_1078 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1756 = torch.aten.reshape %1753#0, %1755 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_1079 = torch.constant.int 1
%int2_1080 = torch.constant.int 2
%1757 = torch.aten.transpose.int %1756, %int1_1079, %int2_1080 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%1758 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_1081 = torch.constant.int 1
%int7_1082 = torch.constant.int 7
%int25_1083 = torch.constant.int 25
%int64_1084 = torch.constant.int 64
%1759 = torch.prim.ListConstruct %int1_1081, %int7_1082, %int25_1083, %int64_1084 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1760 = torch.aten.reshape %1753#1, %1759 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_1085 = torch.constant.int 1
%int2_1086 = torch.constant.int 2
%1761 = torch.aten.transpose.int %1760, %int1_1085, %int2_1086 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%1762 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_1087 = torch.constant.int 1
%int7_1088 = torch.constant.int 7
%int25_1089 = torch.constant.int 25
%int64_1090 = torch.constant.int 64
%1763 = torch.prim.ListConstruct %int1_1087, %int7_1088, %int25_1089, %int64_1090 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1764 = torch.aten.reshape %1753#2, %1763 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_1091 = torch.constant.int 1
%int2_1092 = torch.constant.int 2
%1765 = torch.aten.transpose.int %1764, %int1_1091, %int2_1092 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_1093 = torch.constant.int 1
%int2_1094 = torch.constant.int 2
%1766 = torch.aten.transpose.int %1760, %int1_1093, %int2_1094 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_1095 = torch.constant.int 2
%int3_1096 = torch.constant.int 3
%1767 = torch.aten.transpose.int %1766, %int2_1095, %int3_1096 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%1768 = torch.aten.matmul %1757, %1767 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%1769 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%1770 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%1771 = torch.aten.pow.Tensor_Tensor %1769, %1770 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%1772 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_1097 = torch.constant.int 0
%1773 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_1098 = torch.constant.none
%float0.000000e00_1099 = torch.constant.float 0.000000e+00
%1774 = torch.aten.full %1773, %float0.000000e00_1099, %none_1098, %none_1098, %none_1098, %none_1098 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_1100 = torch.constant.int 1
%1775 = torch.aten.add.Tensor %1774, %1771, %int1_1100 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%1776 = torch.aten.div.Tensor %1768, %1775 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%1777 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6_1101 = torch.constant.int 6
%none_1102 = torch.constant.none
%false_1103 = torch.constant.bool false
%1778 = torch.aten.to.dtype %1776, %int6_1101, %false_1103, %false_1103, %none_1102 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%1779 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%1780 = torch.aten.where.self %1777, %1778, %1779 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_1104 = torch.constant.int 3
%none_1105 = torch.constant.none
%1781 = torch.aten.softmax.int %1780, %int3_1104, %none_1105 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_1106 = torch.constant.int 6
%none_1107 = torch.constant.none
%false_1108 = torch.constant.bool false
%1782 = torch.aten.to.dtype %1781, %int6_1106, %false_1108, %false_1108, %none_1107 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%1783 = torch.aten.matmul %1782, %1765 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_1109 = torch.constant.int 1
%int2_1110 = torch.constant.int 2
%1784 = torch.aten.transpose.int %1783, %int1_1109, %int2_1110 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%1785 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1111 = torch.constant.int 1
%int7_1112 = torch.constant.int 7
%int1600_1113 = torch.constant.int 1600
%1786 = torch.prim.ListConstruct %int1_1111, %int7_1112, %int1600_1113 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1787 = torch.aten.reshape %1784, %1786 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%1788 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1114 = torch.constant.int 7
%int1600_1115 = torch.constant.int 1600
%1789 = torch.prim.ListConstruct %int7_1114, %int1600_1115 : (!torch.int, !torch.int) -> !torch.list<int>
%1790 = torch.aten.reshape %1787, %1789 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_1116 = torch.constant.int 0
%int1_1117 = torch.constant.int 1
%1791 = torch.aten.mm %1790, %162 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%1792 = torch.aten.add.Tensor %1791, %163, %int1_1117 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%1793 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1118 = torch.constant.int 1
%int7_1119 = torch.constant.int 7
%int1600_1120 = torch.constant.int 1600
%1794 = torch.prim.ListConstruct %int1_1118, %int7_1119, %int1600_1120 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1795 = torch.aten.reshape %1792, %1794 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_1121 = torch.constant.int 1
%1796 = torch.aten.add.Tensor %1795, %1740, %int1_1121 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_1122 = torch.constant.float 9.9999997473787516E-6
%int1600_1123 = torch.constant.int 1600
%1797 = torch.prim.ListConstruct %int1600_1123 : (!torch.int) -> !torch.list<int>
%result0_1124, %result1_1125, %result2_1126 = torch.aten.native_layer_norm %1796, %1797, %164, %165, %float9.999990e-06_1122 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%1798 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1127 = torch.constant.int 7
%int1600_1128 = torch.constant.int 1600
%1799 = torch.prim.ListConstruct %int7_1127, %int1600_1128 : (!torch.int, !torch.int) -> !torch.list<int>
%1800 = torch.aten.reshape %result0_1124, %1799 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_1129 = torch.constant.int 0
%int1_1130 = torch.constant.int 1
%1801 = torch.aten.mm %1800, %166 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%1802 = torch.aten.add.Tensor %1801, %167, %int1_1130 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%1803 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1131 = torch.constant.int 1
%int7_1132 = torch.constant.int 7
%int6400_1133 = torch.constant.int 6400
%1804 = torch.prim.ListConstruct %int1_1131, %int7_1132, %int6400_1133 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1805 = torch.aten.reshape %1802, %1804 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%1806 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%1807 = torch.aten.mul.Tensor %1805, %1806 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%1808 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%1809 = torch.aten.pow.Tensor_Tensor %1805, %1808 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%1810 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%1811 = torch.aten.mul.Tensor %1809, %1810 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_1134 = torch.constant.int 1
%1812 = torch.aten.add.Tensor %1805, %1811, %int1_1134 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%1813 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%1814 = torch.aten.mul.Tensor %1812, %1813 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%1815 = torch.aten.tanh %1814 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%1816 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_1135 = torch.constant.int 1
%1817 = torch.aten.add.Tensor %1815, %1816, %int1_1135 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%1818 = torch.aten.mul.Tensor %1807, %1817 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%1819 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1136 = torch.constant.int 7
%int6400_1137 = torch.constant.int 6400
%1820 = torch.prim.ListConstruct %int7_1136, %int6400_1137 : (!torch.int, !torch.int) -> !torch.list<int>
%1821 = torch.aten.reshape %1818, %1820 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_1138 = torch.constant.int 0
%int1_1139 = torch.constant.int 1
%1822 = torch.aten.mm %1821, %168 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%1823 = torch.aten.add.Tensor %1822, %169, %int1_1139 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%1824 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1140 = torch.constant.int 1
%int7_1141 = torch.constant.int 7
%int1600_1142 = torch.constant.int 1600
%1825 = torch.prim.ListConstruct %int1_1140, %int7_1141, %int1600_1142 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1826 = torch.aten.reshape %1823, %1825 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_1143 = torch.constant.int 1
%1827 = torch.aten.add.Tensor %1796, %1826, %int1_1143 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_1144 = torch.constant.float 9.9999997473787516E-6
%int1600_1145 = torch.constant.int 1600
%1828 = torch.prim.ListConstruct %int1600_1145 : (!torch.int) -> !torch.list<int>
%result0_1146, %result1_1147, %result2_1148 = torch.aten.native_layer_norm %1827, %1828, %170, %171, %float9.999990e-06_1144 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%1829 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1149 = torch.constant.int 7
%int1600_1150 = torch.constant.int 1600
%1830 = torch.prim.ListConstruct %int7_1149, %int1600_1150 : (!torch.int, !torch.int) -> !torch.list<int>
%1831 = torch.aten.reshape %result0_1146, %1830 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_1151 = torch.constant.int 0
%int1_1152 = torch.constant.int 1
%1832 = torch.aten.mm %1831, %172 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%1833 = torch.aten.add.Tensor %1832, %173, %int1_1152 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%1834 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1153 = torch.constant.int 1
%int7_1154 = torch.constant.int 7
%int4800_1155 = torch.constant.int 4800
%1835 = torch.prim.ListConstruct %int1_1153, %int7_1154, %int4800_1155 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1836 = torch.aten.reshape %1833, %1835 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%1837 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%1838 = torch.prim.tolist(%1837) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2_1156 = torch.constant.int 2
%1839 = torch.aten.split_with_sizes %1836, %1838, %int2_1156 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%1840:3 = torch.prim.ListUnpack %1839 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%1841 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_1157 = torch.constant.int 1
%int7_1158 = torch.constant.int 7
%int25_1159 = torch.constant.int 25
%int64_1160 = torch.constant.int 64
%1842 = torch.prim.ListConstruct %int1_1157, %int7_1158, %int25_1159, %int64_1160 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1843 = torch.aten.reshape %1840#0, %1842 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_1161 = torch.constant.int 1
%int2_1162 = torch.constant.int 2
%1844 = torch.aten.transpose.int %1843, %int1_1161, %int2_1162 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%1845 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_1163 = torch.constant.int 1
%int7_1164 = torch.constant.int 7
%int25_1165 = torch.constant.int 25
%int64_1166 = torch.constant.int 64
%1846 = torch.prim.ListConstruct %int1_1163, %int7_1164, %int25_1165, %int64_1166 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1847 = torch.aten.reshape %1840#1, %1846 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_1167 = torch.constant.int 1
%int2_1168 = torch.constant.int 2
%1848 = torch.aten.transpose.int %1847, %int1_1167, %int2_1168 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%1849 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_1169 = torch.constant.int 1
%int7_1170 = torch.constant.int 7
%int25_1171 = torch.constant.int 25
%int64_1172 = torch.constant.int 64
%1850 = torch.prim.ListConstruct %int1_1169, %int7_1170, %int25_1171, %int64_1172 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1851 = torch.aten.reshape %1840#2, %1850 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_1173 = torch.constant.int 1
%int2_1174 = torch.constant.int 2
%1852 = torch.aten.transpose.int %1851, %int1_1173, %int2_1174 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_1175 = torch.constant.int 1
%int2_1176 = torch.constant.int 2
%1853 = torch.aten.transpose.int %1847, %int1_1175, %int2_1176 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_1177 = torch.constant.int 2
%int3_1178 = torch.constant.int 3
%1854 = torch.aten.transpose.int %1853, %int2_1177, %int3_1178 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%1855 = torch.aten.matmul %1844, %1854 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%1856 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%1857 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%1858 = torch.aten.pow.Tensor_Tensor %1856, %1857 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%1859 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_1179 = torch.constant.int 0
%1860 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_1180 = torch.constant.none
%float0.000000e00_1181 = torch.constant.float 0.000000e+00
%1861 = torch.aten.full %1860, %float0.000000e00_1181, %none_1180, %none_1180, %none_1180, %none_1180 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_1182 = torch.constant.int 1
%1862 = torch.aten.add.Tensor %1861, %1858, %int1_1182 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%1863 = torch.aten.div.Tensor %1855, %1862 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%1864 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6_1183 = torch.constant.int 6
%none_1184 = torch.constant.none
%false_1185 = torch.constant.bool false
%1865 = torch.aten.to.dtype %1863, %int6_1183, %false_1185, %false_1185, %none_1184 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%1866 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%1867 = torch.aten.where.self %1864, %1865, %1866 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_1186 = torch.constant.int 3
%none_1187 = torch.constant.none
%1868 = torch.aten.softmax.int %1867, %int3_1186, %none_1187 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_1188 = torch.constant.int 6
%none_1189 = torch.constant.none
%false_1190 = torch.constant.bool false
%1869 = torch.aten.to.dtype %1868, %int6_1188, %false_1190, %false_1190, %none_1189 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%1870 = torch.aten.matmul %1869, %1852 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_1191 = torch.constant.int 1
%int2_1192 = torch.constant.int 2
%1871 = torch.aten.transpose.int %1870, %int1_1191, %int2_1192 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%1872 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1193 = torch.constant.int 1
%int7_1194 = torch.constant.int 7
%int1600_1195 = torch.constant.int 1600
%1873 = torch.prim.ListConstruct %int1_1193, %int7_1194, %int1600_1195 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1874 = torch.aten.reshape %1871, %1873 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%1875 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1196 = torch.constant.int 7
%int1600_1197 = torch.constant.int 1600
%1876 = torch.prim.ListConstruct %int7_1196, %int1600_1197 : (!torch.int, !torch.int) -> !torch.list<int>
%1877 = torch.aten.reshape %1874, %1876 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_1198 = torch.constant.int 0
%int1_1199 = torch.constant.int 1
%1878 = torch.aten.mm %1877, %174 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%1879 = torch.aten.add.Tensor %1878, %175, %int1_1199 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%1880 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1200 = torch.constant.int 1
%int7_1201 = torch.constant.int 7
%int1600_1202 = torch.constant.int 1600
%1881 = torch.prim.ListConstruct %int1_1200, %int7_1201, %int1600_1202 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1882 = torch.aten.reshape %1879, %1881 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_1203 = torch.constant.int 1
%1883 = torch.aten.add.Tensor %1882, %1827, %int1_1203 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_1204 = torch.constant.float 9.9999997473787516E-6
%int1600_1205 = torch.constant.int 1600
%1884 = torch.prim.ListConstruct %int1600_1205 : (!torch.int) -> !torch.list<int>
%result0_1206, %result1_1207, %result2_1208 = torch.aten.native_layer_norm %1883, %1884, %176, %177, %float9.999990e-06_1204 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%1885 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1209 = torch.constant.int 7
%int1600_1210 = torch.constant.int 1600
%1886 = torch.prim.ListConstruct %int7_1209, %int1600_1210 : (!torch.int, !torch.int) -> !torch.list<int>
%1887 = torch.aten.reshape %result0_1206, %1886 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_1211 = torch.constant.int 0
%int1_1212 = torch.constant.int 1
%1888 = torch.aten.mm %1887, %178 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%1889 = torch.aten.add.Tensor %1888, %179, %int1_1212 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%1890 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1213 = torch.constant.int 1
%int7_1214 = torch.constant.int 7
%int6400_1215 = torch.constant.int 6400
%1891 = torch.prim.ListConstruct %int1_1213, %int7_1214, %int6400_1215 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1892 = torch.aten.reshape %1889, %1891 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%1893 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%1894 = torch.aten.mul.Tensor %1892, %1893 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%1895 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%1896 = torch.aten.pow.Tensor_Tensor %1892, %1895 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%1897 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%1898 = torch.aten.mul.Tensor %1896, %1897 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_1216 = torch.constant.int 1
%1899 = torch.aten.add.Tensor %1892, %1898, %int1_1216 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%1900 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%1901 = torch.aten.mul.Tensor %1899, %1900 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%1902 = torch.aten.tanh %1901 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%1903 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_1217 = torch.constant.int 1
%1904 = torch.aten.add.Tensor %1902, %1903, %int1_1217 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%1905 = torch.aten.mul.Tensor %1894, %1904 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%1906 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1218 = torch.constant.int 7
%int6400_1219 = torch.constant.int 6400
%1907 = torch.prim.ListConstruct %int7_1218, %int6400_1219 : (!torch.int, !torch.int) -> !torch.list<int>
%1908 = torch.aten.reshape %1905, %1907 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_1220 = torch.constant.int 0
%int1_1221 = torch.constant.int 1
%1909 = torch.aten.mm %1908, %180 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%1910 = torch.aten.add.Tensor %1909, %181, %int1_1221 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%1911 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1222 = torch.constant.int 1
%int7_1223 = torch.constant.int 7
%int1600_1224 = torch.constant.int 1600
%1912 = torch.prim.ListConstruct %int1_1222, %int7_1223, %int1600_1224 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1913 = torch.aten.reshape %1910, %1912 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_1225 = torch.constant.int 1
%1914 = torch.aten.add.Tensor %1883, %1913, %int1_1225 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_1226 = torch.constant.float 9.9999997473787516E-6
%int1600_1227 = torch.constant.int 1600
%1915 = torch.prim.ListConstruct %int1600_1227 : (!torch.int) -> !torch.list<int>
%result0_1228, %result1_1229, %result2_1230 = torch.aten.native_layer_norm %1914, %1915, %182, %183, %float9.999990e-06_1226 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%1916 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1231 = torch.constant.int 7
%int1600_1232 = torch.constant.int 1600
%1917 = torch.prim.ListConstruct %int7_1231, %int1600_1232 : (!torch.int, !torch.int) -> !torch.list<int>
%1918 = torch.aten.reshape %result0_1228, %1917 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_1233 = torch.constant.int 0
%int1_1234 = torch.constant.int 1
%1919 = torch.aten.mm %1918, %184 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%1920 = torch.aten.add.Tensor %1919, %185, %int1_1234 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%1921 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1235 = torch.constant.int 1
%int7_1236 = torch.constant.int 7
%int4800_1237 = torch.constant.int 4800
%1922 = torch.prim.ListConstruct %int1_1235, %int7_1236, %int4800_1237 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1923 = torch.aten.reshape %1920, %1922 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%1924 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%1925 = torch.prim.tolist(%1924) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2_1238 = torch.constant.int 2
%1926 = torch.aten.split_with_sizes %1923, %1925, %int2_1238 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%1927:3 = torch.prim.ListUnpack %1926 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%1928 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_1239 = torch.constant.int 1
%int7_1240 = torch.constant.int 7
%int25_1241 = torch.constant.int 25
%int64_1242 = torch.constant.int 64
%1929 = torch.prim.ListConstruct %int1_1239, %int7_1240, %int25_1241, %int64_1242 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1930 = torch.aten.reshape %1927#0, %1929 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_1243 = torch.constant.int 1
%int2_1244 = torch.constant.int 2
%1931 = torch.aten.transpose.int %1930, %int1_1243, %int2_1244 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%1932 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_1245 = torch.constant.int 1
%int7_1246 = torch.constant.int 7
%int25_1247 = torch.constant.int 25
%int64_1248 = torch.constant.int 64
%1933 = torch.prim.ListConstruct %int1_1245, %int7_1246, %int25_1247, %int64_1248 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1934 = torch.aten.reshape %1927#1, %1933 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_1249 = torch.constant.int 1
%int2_1250 = torch.constant.int 2
%1935 = torch.aten.transpose.int %1934, %int1_1249, %int2_1250 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%1936 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_1251 = torch.constant.int 1
%int7_1252 = torch.constant.int 7
%int25_1253 = torch.constant.int 25
%int64_1254 = torch.constant.int 64
%1937 = torch.prim.ListConstruct %int1_1251, %int7_1252, %int25_1253, %int64_1254 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1938 = torch.aten.reshape %1927#2, %1937 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_1255 = torch.constant.int 1
%int2_1256 = torch.constant.int 2
%1939 = torch.aten.transpose.int %1938, %int1_1255, %int2_1256 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_1257 = torch.constant.int 1
%int2_1258 = torch.constant.int 2
%1940 = torch.aten.transpose.int %1934, %int1_1257, %int2_1258 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_1259 = torch.constant.int 2
%int3_1260 = torch.constant.int 3
%1941 = torch.aten.transpose.int %1940, %int2_1259, %int3_1260 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%1942 = torch.aten.matmul %1931, %1941 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%1943 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%1944 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%1945 = torch.aten.pow.Tensor_Tensor %1943, %1944 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%1946 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_1261 = torch.constant.int 0
%1947 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_1262 = torch.constant.none
%float0.000000e00_1263 = torch.constant.float 0.000000e+00
%1948 = torch.aten.full %1947, %float0.000000e00_1263, %none_1262, %none_1262, %none_1262, %none_1262 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_1264 = torch.constant.int 1
%1949 = torch.aten.add.Tensor %1948, %1945, %int1_1264 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%1950 = torch.aten.div.Tensor %1942, %1949 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%1951 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6_1265 = torch.constant.int 6
%none_1266 = torch.constant.none
%false_1267 = torch.constant.bool false
%1952 = torch.aten.to.dtype %1950, %int6_1265, %false_1267, %false_1267, %none_1266 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%1953 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%1954 = torch.aten.where.self %1951, %1952, %1953 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_1268 = torch.constant.int 3
%none_1269 = torch.constant.none
%1955 = torch.aten.softmax.int %1954, %int3_1268, %none_1269 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_1270 = torch.constant.int 6
%none_1271 = torch.constant.none
%false_1272 = torch.constant.bool false
%1956 = torch.aten.to.dtype %1955, %int6_1270, %false_1272, %false_1272, %none_1271 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%1957 = torch.aten.matmul %1956, %1939 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_1273 = torch.constant.int 1
%int2_1274 = torch.constant.int 2
%1958 = torch.aten.transpose.int %1957, %int1_1273, %int2_1274 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%1959 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1275 = torch.constant.int 1
%int7_1276 = torch.constant.int 7
%int1600_1277 = torch.constant.int 1600
%1960 = torch.prim.ListConstruct %int1_1275, %int7_1276, %int1600_1277 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1961 = torch.aten.reshape %1958, %1960 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%1962 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1278 = torch.constant.int 7
%int1600_1279 = torch.constant.int 1600
%1963 = torch.prim.ListConstruct %int7_1278, %int1600_1279 : (!torch.int, !torch.int) -> !torch.list<int>
%1964 = torch.aten.reshape %1961, %1963 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_1280 = torch.constant.int 0
%int1_1281 = torch.constant.int 1
%1965 = torch.aten.mm %1964, %186 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%1966 = torch.aten.add.Tensor %1965, %187, %int1_1281 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%1967 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1282 = torch.constant.int 1
%int7_1283 = torch.constant.int 7
%int1600_1284 = torch.constant.int 1600
%1968 = torch.prim.ListConstruct %int1_1282, %int7_1283, %int1600_1284 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1969 = torch.aten.reshape %1966, %1968 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_1285 = torch.constant.int 1
%1970 = torch.aten.add.Tensor %1969, %1914, %int1_1285 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_1286 = torch.constant.float 9.9999997473787516E-6
%int1600_1287 = torch.constant.int 1600
%1971 = torch.prim.ListConstruct %int1600_1287 : (!torch.int) -> !torch.list<int>
%result0_1288, %result1_1289, %result2_1290 = torch.aten.native_layer_norm %1970, %1971, %188, %189, %float9.999990e-06_1286 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%1972 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1291 = torch.constant.int 7
%int1600_1292 = torch.constant.int 1600
%1973 = torch.prim.ListConstruct %int7_1291, %int1600_1292 : (!torch.int, !torch.int) -> !torch.list<int>
%1974 = torch.aten.reshape %result0_1288, %1973 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_1293 = torch.constant.int 0
%int1_1294 = torch.constant.int 1
%1975 = torch.aten.mm %1974, %190 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%1976 = torch.aten.add.Tensor %1975, %191, %int1_1294 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%1977 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1295 = torch.constant.int 1
%int7_1296 = torch.constant.int 7
%int6400_1297 = torch.constant.int 6400
%1978 = torch.prim.ListConstruct %int1_1295, %int7_1296, %int6400_1297 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%1979 = torch.aten.reshape %1976, %1978 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%1980 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%1981 = torch.aten.mul.Tensor %1979, %1980 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%1982 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%1983 = torch.aten.pow.Tensor_Tensor %1979, %1982 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%1984 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%1985 = torch.aten.mul.Tensor %1983, %1984 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_1298 = torch.constant.int 1
%1986 = torch.aten.add.Tensor %1979, %1985, %int1_1298 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%1987 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%1988 = torch.aten.mul.Tensor %1986, %1987 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%1989 = torch.aten.tanh %1988 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%1990 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_1299 = torch.constant.int 1
%1991 = torch.aten.add.Tensor %1989, %1990, %int1_1299 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%1992 = torch.aten.mul.Tensor %1981, %1991 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%1993 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1300 = torch.constant.int 7
%int6400_1301 = torch.constant.int 6400
%1994 = torch.prim.ListConstruct %int7_1300, %int6400_1301 : (!torch.int, !torch.int) -> !torch.list<int>
%1995 = torch.aten.reshape %1992, %1994 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_1302 = torch.constant.int 0
%int1_1303 = torch.constant.int 1
%1996 = torch.aten.mm %1995, %192 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%1997 = torch.aten.add.Tensor %1996, %193, %int1_1303 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%1998 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1304 = torch.constant.int 1
%int7_1305 = torch.constant.int 7
%int1600_1306 = torch.constant.int 1600
%1999 = torch.prim.ListConstruct %int1_1304, %int7_1305, %int1600_1306 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2000 = torch.aten.reshape %1997, %1999 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_1307 = torch.constant.int 1
%2001 = torch.aten.add.Tensor %1970, %2000, %int1_1307 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_1308 = torch.constant.float 9.9999997473787516E-6
%int1600_1309 = torch.constant.int 1600
%2002 = torch.prim.ListConstruct %int1600_1309 : (!torch.int) -> !torch.list<int>
%result0_1310, %result1_1311, %result2_1312 = torch.aten.native_layer_norm %2001, %2002, %194, %195, %float9.999990e-06_1308 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%2003 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1313 = torch.constant.int 7
%int1600_1314 = torch.constant.int 1600
%2004 = torch.prim.ListConstruct %int7_1313, %int1600_1314 : (!torch.int, !torch.int) -> !torch.list<int>
%2005 = torch.aten.reshape %result0_1310, %2004 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_1315 = torch.constant.int 0
%int1_1316 = torch.constant.int 1
%2006 = torch.aten.mm %2005, %196 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%2007 = torch.aten.add.Tensor %2006, %197, %int1_1316 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%2008 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1317 = torch.constant.int 1
%int7_1318 = torch.constant.int 7
%int4800_1319 = torch.constant.int 4800
%2009 = torch.prim.ListConstruct %int1_1317, %int7_1318, %int4800_1319 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2010 = torch.aten.reshape %2007, %2009 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%2011 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%2012 = torch.prim.tolist(%2011) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2_1320 = torch.constant.int 2
%2013 = torch.aten.split_with_sizes %2010, %2012, %int2_1320 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%2014:3 = torch.prim.ListUnpack %2013 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%2015 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_1321 = torch.constant.int 1
%int7_1322 = torch.constant.int 7
%int25_1323 = torch.constant.int 25
%int64_1324 = torch.constant.int 64
%2016 = torch.prim.ListConstruct %int1_1321, %int7_1322, %int25_1323, %int64_1324 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2017 = torch.aten.reshape %2014#0, %2016 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_1325 = torch.constant.int 1
%int2_1326 = torch.constant.int 2
%2018 = torch.aten.transpose.int %2017, %int1_1325, %int2_1326 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%2019 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_1327 = torch.constant.int 1
%int7_1328 = torch.constant.int 7
%int25_1329 = torch.constant.int 25
%int64_1330 = torch.constant.int 64
%2020 = torch.prim.ListConstruct %int1_1327, %int7_1328, %int25_1329, %int64_1330 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2021 = torch.aten.reshape %2014#1, %2020 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_1331 = torch.constant.int 1
%int2_1332 = torch.constant.int 2
%2022 = torch.aten.transpose.int %2021, %int1_1331, %int2_1332 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%2023 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_1333 = torch.constant.int 1
%int7_1334 = torch.constant.int 7
%int25_1335 = torch.constant.int 25
%int64_1336 = torch.constant.int 64
%2024 = torch.prim.ListConstruct %int1_1333, %int7_1334, %int25_1335, %int64_1336 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2025 = torch.aten.reshape %2014#2, %2024 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_1337 = torch.constant.int 1
%int2_1338 = torch.constant.int 2
%2026 = torch.aten.transpose.int %2025, %int1_1337, %int2_1338 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_1339 = torch.constant.int 1
%int2_1340 = torch.constant.int 2
%2027 = torch.aten.transpose.int %2021, %int1_1339, %int2_1340 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_1341 = torch.constant.int 2
%int3_1342 = torch.constant.int 3
%2028 = torch.aten.transpose.int %2027, %int2_1341, %int3_1342 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%2029 = torch.aten.matmul %2018, %2028 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%2030 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%2031 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%2032 = torch.aten.pow.Tensor_Tensor %2030, %2031 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%2033 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_1343 = torch.constant.int 0
%2034 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_1344 = torch.constant.none
%float0.000000e00_1345 = torch.constant.float 0.000000e+00
%2035 = torch.aten.full %2034, %float0.000000e00_1345, %none_1344, %none_1344, %none_1344, %none_1344 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_1346 = torch.constant.int 1
%2036 = torch.aten.add.Tensor %2035, %2032, %int1_1346 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%2037 = torch.aten.div.Tensor %2029, %2036 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%2038 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6_1347 = torch.constant.int 6
%none_1348 = torch.constant.none
%false_1349 = torch.constant.bool false
%2039 = torch.aten.to.dtype %2037, %int6_1347, %false_1349, %false_1349, %none_1348 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%2040 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%2041 = torch.aten.where.self %2038, %2039, %2040 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_1350 = torch.constant.int 3
%none_1351 = torch.constant.none
%2042 = torch.aten.softmax.int %2041, %int3_1350, %none_1351 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_1352 = torch.constant.int 6
%none_1353 = torch.constant.none
%false_1354 = torch.constant.bool false
%2043 = torch.aten.to.dtype %2042, %int6_1352, %false_1354, %false_1354, %none_1353 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%2044 = torch.aten.matmul %2043, %2026 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_1355 = torch.constant.int 1
%int2_1356 = torch.constant.int 2
%2045 = torch.aten.transpose.int %2044, %int1_1355, %int2_1356 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%2046 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1357 = torch.constant.int 1
%int7_1358 = torch.constant.int 7
%int1600_1359 = torch.constant.int 1600
%2047 = torch.prim.ListConstruct %int1_1357, %int7_1358, %int1600_1359 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2048 = torch.aten.reshape %2045, %2047 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%2049 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1360 = torch.constant.int 7
%int1600_1361 = torch.constant.int 1600
%2050 = torch.prim.ListConstruct %int7_1360, %int1600_1361 : (!torch.int, !torch.int) -> !torch.list<int>
%2051 = torch.aten.reshape %2048, %2050 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_1362 = torch.constant.int 0
%int1_1363 = torch.constant.int 1
%2052 = torch.aten.mm %2051, %198 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%2053 = torch.aten.add.Tensor %2052, %199, %int1_1363 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%2054 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1364 = torch.constant.int 1
%int7_1365 = torch.constant.int 7
%int1600_1366 = torch.constant.int 1600
%2055 = torch.prim.ListConstruct %int1_1364, %int7_1365, %int1600_1366 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2056 = torch.aten.reshape %2053, %2055 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_1367 = torch.constant.int 1
%2057 = torch.aten.add.Tensor %2056, %2001, %int1_1367 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_1368 = torch.constant.float 9.9999997473787516E-6
%int1600_1369 = torch.constant.int 1600
%2058 = torch.prim.ListConstruct %int1600_1369 : (!torch.int) -> !torch.list<int>
%result0_1370, %result1_1371, %result2_1372 = torch.aten.native_layer_norm %2057, %2058, %200, %201, %float9.999990e-06_1368 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%2059 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1373 = torch.constant.int 7
%int1600_1374 = torch.constant.int 1600
%2060 = torch.prim.ListConstruct %int7_1373, %int1600_1374 : (!torch.int, !torch.int) -> !torch.list<int>
%2061 = torch.aten.reshape %result0_1370, %2060 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_1375 = torch.constant.int 0
%int1_1376 = torch.constant.int 1
%2062 = torch.aten.mm %2061, %202 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%2063 = torch.aten.add.Tensor %2062, %203, %int1_1376 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%2064 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1377 = torch.constant.int 1
%int7_1378 = torch.constant.int 7
%int6400_1379 = torch.constant.int 6400
%2065 = torch.prim.ListConstruct %int1_1377, %int7_1378, %int6400_1379 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2066 = torch.aten.reshape %2063, %2065 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%2067 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%2068 = torch.aten.mul.Tensor %2066, %2067 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%2069 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%2070 = torch.aten.pow.Tensor_Tensor %2066, %2069 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%2071 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%2072 = torch.aten.mul.Tensor %2070, %2071 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_1380 = torch.constant.int 1
%2073 = torch.aten.add.Tensor %2066, %2072, %int1_1380 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%2074 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%2075 = torch.aten.mul.Tensor %2073, %2074 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%2076 = torch.aten.tanh %2075 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%2077 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_1381 = torch.constant.int 1
%2078 = torch.aten.add.Tensor %2076, %2077, %int1_1381 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%2079 = torch.aten.mul.Tensor %2068, %2078 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%2080 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1382 = torch.constant.int 7
%int6400_1383 = torch.constant.int 6400
%2081 = torch.prim.ListConstruct %int7_1382, %int6400_1383 : (!torch.int, !torch.int) -> !torch.list<int>
%2082 = torch.aten.reshape %2079, %2081 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_1384 = torch.constant.int 0
%int1_1385 = torch.constant.int 1
%2083 = torch.aten.mm %2082, %204 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%2084 = torch.aten.add.Tensor %2083, %205, %int1_1385 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%2085 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1386 = torch.constant.int 1
%int7_1387 = torch.constant.int 7
%int1600_1388 = torch.constant.int 1600
%2086 = torch.prim.ListConstruct %int1_1386, %int7_1387, %int1600_1388 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2087 = torch.aten.reshape %2084, %2086 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_1389 = torch.constant.int 1
%2088 = torch.aten.add.Tensor %2057, %2087, %int1_1389 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_1390 = torch.constant.float 9.9999997473787516E-6
%int1600_1391 = torch.constant.int 1600
%2089 = torch.prim.ListConstruct %int1600_1391 : (!torch.int) -> !torch.list<int>
%result0_1392, %result1_1393, %result2_1394 = torch.aten.native_layer_norm %2088, %2089, %206, %207, %float9.999990e-06_1390 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%2090 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1395 = torch.constant.int 7
%int1600_1396 = torch.constant.int 1600
%2091 = torch.prim.ListConstruct %int7_1395, %int1600_1396 : (!torch.int, !torch.int) -> !torch.list<int>
%2092 = torch.aten.reshape %result0_1392, %2091 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_1397 = torch.constant.int 0
%int1_1398 = torch.constant.int 1
%2093 = torch.aten.mm %2092, %208 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%2094 = torch.aten.add.Tensor %2093, %209, %int1_1398 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%2095 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1399 = torch.constant.int 1
%int7_1400 = torch.constant.int 7
%int4800_1401 = torch.constant.int 4800
%2096 = torch.prim.ListConstruct %int1_1399, %int7_1400, %int4800_1401 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2097 = torch.aten.reshape %2094, %2096 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%2098 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%2099 = torch.prim.tolist(%2098) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2_1402 = torch.constant.int 2
%2100 = torch.aten.split_with_sizes %2097, %2099, %int2_1402 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%2101:3 = torch.prim.ListUnpack %2100 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%2102 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_1403 = torch.constant.int 1
%int7_1404 = torch.constant.int 7
%int25_1405 = torch.constant.int 25
%int64_1406 = torch.constant.int 64
%2103 = torch.prim.ListConstruct %int1_1403, %int7_1404, %int25_1405, %int64_1406 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2104 = torch.aten.reshape %2101#0, %2103 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_1407 = torch.constant.int 1
%int2_1408 = torch.constant.int 2
%2105 = torch.aten.transpose.int %2104, %int1_1407, %int2_1408 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%2106 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_1409 = torch.constant.int 1
%int7_1410 = torch.constant.int 7
%int25_1411 = torch.constant.int 25
%int64_1412 = torch.constant.int 64
%2107 = torch.prim.ListConstruct %int1_1409, %int7_1410, %int25_1411, %int64_1412 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2108 = torch.aten.reshape %2101#1, %2107 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_1413 = torch.constant.int 1
%int2_1414 = torch.constant.int 2
%2109 = torch.aten.transpose.int %2108, %int1_1413, %int2_1414 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%2110 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_1415 = torch.constant.int 1
%int7_1416 = torch.constant.int 7
%int25_1417 = torch.constant.int 25
%int64_1418 = torch.constant.int 64
%2111 = torch.prim.ListConstruct %int1_1415, %int7_1416, %int25_1417, %int64_1418 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2112 = torch.aten.reshape %2101#2, %2111 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_1419 = torch.constant.int 1
%int2_1420 = torch.constant.int 2
%2113 = torch.aten.transpose.int %2112, %int1_1419, %int2_1420 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_1421 = torch.constant.int 1
%int2_1422 = torch.constant.int 2
%2114 = torch.aten.transpose.int %2108, %int1_1421, %int2_1422 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_1423 = torch.constant.int 2
%int3_1424 = torch.constant.int 3
%2115 = torch.aten.transpose.int %2114, %int2_1423, %int3_1424 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%2116 = torch.aten.matmul %2105, %2115 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%2117 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%2118 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%2119 = torch.aten.pow.Tensor_Tensor %2117, %2118 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%2120 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_1425 = torch.constant.int 0
%2121 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_1426 = torch.constant.none
%float0.000000e00_1427 = torch.constant.float 0.000000e+00
%2122 = torch.aten.full %2121, %float0.000000e00_1427, %none_1426, %none_1426, %none_1426, %none_1426 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_1428 = torch.constant.int 1
%2123 = torch.aten.add.Tensor %2122, %2119, %int1_1428 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%2124 = torch.aten.div.Tensor %2116, %2123 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%2125 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6_1429 = torch.constant.int 6
%none_1430 = torch.constant.none
%false_1431 = torch.constant.bool false
%2126 = torch.aten.to.dtype %2124, %int6_1429, %false_1431, %false_1431, %none_1430 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%2127 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%2128 = torch.aten.where.self %2125, %2126, %2127 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_1432 = torch.constant.int 3
%none_1433 = torch.constant.none
%2129 = torch.aten.softmax.int %2128, %int3_1432, %none_1433 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_1434 = torch.constant.int 6
%none_1435 = torch.constant.none
%false_1436 = torch.constant.bool false
%2130 = torch.aten.to.dtype %2129, %int6_1434, %false_1436, %false_1436, %none_1435 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%2131 = torch.aten.matmul %2130, %2113 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_1437 = torch.constant.int 1
%int2_1438 = torch.constant.int 2
%2132 = torch.aten.transpose.int %2131, %int1_1437, %int2_1438 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%2133 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1439 = torch.constant.int 1
%int7_1440 = torch.constant.int 7
%int1600_1441 = torch.constant.int 1600
%2134 = torch.prim.ListConstruct %int1_1439, %int7_1440, %int1600_1441 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2135 = torch.aten.reshape %2132, %2134 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%2136 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1442 = torch.constant.int 7
%int1600_1443 = torch.constant.int 1600
%2137 = torch.prim.ListConstruct %int7_1442, %int1600_1443 : (!torch.int, !torch.int) -> !torch.list<int>
%2138 = torch.aten.reshape %2135, %2137 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_1444 = torch.constant.int 0
%int1_1445 = torch.constant.int 1
%2139 = torch.aten.mm %2138, %210 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%2140 = torch.aten.add.Tensor %2139, %211, %int1_1445 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%2141 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1446 = torch.constant.int 1
%int7_1447 = torch.constant.int 7
%int1600_1448 = torch.constant.int 1600
%2142 = torch.prim.ListConstruct %int1_1446, %int7_1447, %int1600_1448 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2143 = torch.aten.reshape %2140, %2142 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_1449 = torch.constant.int 1
%2144 = torch.aten.add.Tensor %2143, %2088, %int1_1449 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_1450 = torch.constant.float 9.9999997473787516E-6
%int1600_1451 = torch.constant.int 1600
%2145 = torch.prim.ListConstruct %int1600_1451 : (!torch.int) -> !torch.list<int>
%result0_1452, %result1_1453, %result2_1454 = torch.aten.native_layer_norm %2144, %2145, %212, %213, %float9.999990e-06_1450 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%2146 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1455 = torch.constant.int 7
%int1600_1456 = torch.constant.int 1600
%2147 = torch.prim.ListConstruct %int7_1455, %int1600_1456 : (!torch.int, !torch.int) -> !torch.list<int>
%2148 = torch.aten.reshape %result0_1452, %2147 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_1457 = torch.constant.int 0
%int1_1458 = torch.constant.int 1
%2149 = torch.aten.mm %2148, %214 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%2150 = torch.aten.add.Tensor %2149, %215, %int1_1458 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%2151 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1459 = torch.constant.int 1
%int7_1460 = torch.constant.int 7
%int6400_1461 = torch.constant.int 6400
%2152 = torch.prim.ListConstruct %int1_1459, %int7_1460, %int6400_1461 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2153 = torch.aten.reshape %2150, %2152 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%2154 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%2155 = torch.aten.mul.Tensor %2153, %2154 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%2156 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%2157 = torch.aten.pow.Tensor_Tensor %2153, %2156 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%2158 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%2159 = torch.aten.mul.Tensor %2157, %2158 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_1462 = torch.constant.int 1
%2160 = torch.aten.add.Tensor %2153, %2159, %int1_1462 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%2161 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%2162 = torch.aten.mul.Tensor %2160, %2161 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%2163 = torch.aten.tanh %2162 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%2164 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_1463 = torch.constant.int 1
%2165 = torch.aten.add.Tensor %2163, %2164, %int1_1463 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%2166 = torch.aten.mul.Tensor %2155, %2165 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%2167 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1464 = torch.constant.int 7
%int6400_1465 = torch.constant.int 6400
%2168 = torch.prim.ListConstruct %int7_1464, %int6400_1465 : (!torch.int, !torch.int) -> !torch.list<int>
%2169 = torch.aten.reshape %2166, %2168 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_1466 = torch.constant.int 0
%int1_1467 = torch.constant.int 1
%2170 = torch.aten.mm %2169, %216 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%2171 = torch.aten.add.Tensor %2170, %217, %int1_1467 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%2172 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1468 = torch.constant.int 1
%int7_1469 = torch.constant.int 7
%int1600_1470 = torch.constant.int 1600
%2173 = torch.prim.ListConstruct %int1_1468, %int7_1469, %int1600_1470 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2174 = torch.aten.reshape %2171, %2173 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_1471 = torch.constant.int 1
%2175 = torch.aten.add.Tensor %2144, %2174, %int1_1471 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_1472 = torch.constant.float 9.9999997473787516E-6
%int1600_1473 = torch.constant.int 1600
%2176 = torch.prim.ListConstruct %int1600_1473 : (!torch.int) -> !torch.list<int>
%result0_1474, %result1_1475, %result2_1476 = torch.aten.native_layer_norm %2175, %2176, %218, %219, %float9.999990e-06_1472 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%2177 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1477 = torch.constant.int 7
%int1600_1478 = torch.constant.int 1600
%2178 = torch.prim.ListConstruct %int7_1477, %int1600_1478 : (!torch.int, !torch.int) -> !torch.list<int>
%2179 = torch.aten.reshape %result0_1474, %2178 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_1479 = torch.constant.int 0
%int1_1480 = torch.constant.int 1
%2180 = torch.aten.mm %2179, %220 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%2181 = torch.aten.add.Tensor %2180, %221, %int1_1480 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%2182 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1481 = torch.constant.int 1
%int7_1482 = torch.constant.int 7
%int4800_1483 = torch.constant.int 4800
%2183 = torch.prim.ListConstruct %int1_1481, %int7_1482, %int4800_1483 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2184 = torch.aten.reshape %2181, %2183 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%2185 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%2186 = torch.prim.tolist(%2185) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2_1484 = torch.constant.int 2
%2187 = torch.aten.split_with_sizes %2184, %2186, %int2_1484 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%2188:3 = torch.prim.ListUnpack %2187 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%2189 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_1485 = torch.constant.int 1
%int7_1486 = torch.constant.int 7
%int25_1487 = torch.constant.int 25
%int64_1488 = torch.constant.int 64
%2190 = torch.prim.ListConstruct %int1_1485, %int7_1486, %int25_1487, %int64_1488 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2191 = torch.aten.reshape %2188#0, %2190 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_1489 = torch.constant.int 1
%int2_1490 = torch.constant.int 2
%2192 = torch.aten.transpose.int %2191, %int1_1489, %int2_1490 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%2193 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_1491 = torch.constant.int 1
%int7_1492 = torch.constant.int 7
%int25_1493 = torch.constant.int 25
%int64_1494 = torch.constant.int 64
%2194 = torch.prim.ListConstruct %int1_1491, %int7_1492, %int25_1493, %int64_1494 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2195 = torch.aten.reshape %2188#1, %2194 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_1495 = torch.constant.int 1
%int2_1496 = torch.constant.int 2
%2196 = torch.aten.transpose.int %2195, %int1_1495, %int2_1496 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%2197 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_1497 = torch.constant.int 1
%int7_1498 = torch.constant.int 7
%int25_1499 = torch.constant.int 25
%int64_1500 = torch.constant.int 64
%2198 = torch.prim.ListConstruct %int1_1497, %int7_1498, %int25_1499, %int64_1500 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2199 = torch.aten.reshape %2188#2, %2198 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_1501 = torch.constant.int 1
%int2_1502 = torch.constant.int 2
%2200 = torch.aten.transpose.int %2199, %int1_1501, %int2_1502 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_1503 = torch.constant.int 1
%int2_1504 = torch.constant.int 2
%2201 = torch.aten.transpose.int %2195, %int1_1503, %int2_1504 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_1505 = torch.constant.int 2
%int3_1506 = torch.constant.int 3
%2202 = torch.aten.transpose.int %2201, %int2_1505, %int3_1506 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%2203 = torch.aten.matmul %2192, %2202 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%2204 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%2205 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%2206 = torch.aten.pow.Tensor_Tensor %2204, %2205 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%2207 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_1507 = torch.constant.int 0
%2208 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_1508 = torch.constant.none
%float0.000000e00_1509 = torch.constant.float 0.000000e+00
%2209 = torch.aten.full %2208, %float0.000000e00_1509, %none_1508, %none_1508, %none_1508, %none_1508 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_1510 = torch.constant.int 1
%2210 = torch.aten.add.Tensor %2209, %2206, %int1_1510 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%2211 = torch.aten.div.Tensor %2203, %2210 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%2212 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6_1511 = torch.constant.int 6
%none_1512 = torch.constant.none
%false_1513 = torch.constant.bool false
%2213 = torch.aten.to.dtype %2211, %int6_1511, %false_1513, %false_1513, %none_1512 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%2214 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%2215 = torch.aten.where.self %2212, %2213, %2214 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_1514 = torch.constant.int 3
%none_1515 = torch.constant.none
%2216 = torch.aten.softmax.int %2215, %int3_1514, %none_1515 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_1516 = torch.constant.int 6
%none_1517 = torch.constant.none
%false_1518 = torch.constant.bool false
%2217 = torch.aten.to.dtype %2216, %int6_1516, %false_1518, %false_1518, %none_1517 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%2218 = torch.aten.matmul %2217, %2200 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_1519 = torch.constant.int 1
%int2_1520 = torch.constant.int 2
%2219 = torch.aten.transpose.int %2218, %int1_1519, %int2_1520 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%2220 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1521 = torch.constant.int 1
%int7_1522 = torch.constant.int 7
%int1600_1523 = torch.constant.int 1600
%2221 = torch.prim.ListConstruct %int1_1521, %int7_1522, %int1600_1523 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2222 = torch.aten.reshape %2219, %2221 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%2223 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1524 = torch.constant.int 7
%int1600_1525 = torch.constant.int 1600
%2224 = torch.prim.ListConstruct %int7_1524, %int1600_1525 : (!torch.int, !torch.int) -> !torch.list<int>
%2225 = torch.aten.reshape %2222, %2224 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_1526 = torch.constant.int 0
%int1_1527 = torch.constant.int 1
%2226 = torch.aten.mm %2225, %222 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%2227 = torch.aten.add.Tensor %2226, %223, %int1_1527 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%2228 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1528 = torch.constant.int 1
%int7_1529 = torch.constant.int 7
%int1600_1530 = torch.constant.int 1600
%2229 = torch.prim.ListConstruct %int1_1528, %int7_1529, %int1600_1530 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2230 = torch.aten.reshape %2227, %2229 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_1531 = torch.constant.int 1
%2231 = torch.aten.add.Tensor %2230, %2175, %int1_1531 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_1532 = torch.constant.float 9.9999997473787516E-6
%int1600_1533 = torch.constant.int 1600
%2232 = torch.prim.ListConstruct %int1600_1533 : (!torch.int) -> !torch.list<int>
%result0_1534, %result1_1535, %result2_1536 = torch.aten.native_layer_norm %2231, %2232, %224, %225, %float9.999990e-06_1532 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%2233 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1537 = torch.constant.int 7
%int1600_1538 = torch.constant.int 1600
%2234 = torch.prim.ListConstruct %int7_1537, %int1600_1538 : (!torch.int, !torch.int) -> !torch.list<int>
%2235 = torch.aten.reshape %result0_1534, %2234 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_1539 = torch.constant.int 0
%int1_1540 = torch.constant.int 1
%2236 = torch.aten.mm %2235, %226 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%2237 = torch.aten.add.Tensor %2236, %227, %int1_1540 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%2238 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1541 = torch.constant.int 1
%int7_1542 = torch.constant.int 7
%int6400_1543 = torch.constant.int 6400
%2239 = torch.prim.ListConstruct %int1_1541, %int7_1542, %int6400_1543 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2240 = torch.aten.reshape %2237, %2239 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%2241 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%2242 = torch.aten.mul.Tensor %2240, %2241 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%2243 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%2244 = torch.aten.pow.Tensor_Tensor %2240, %2243 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%2245 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%2246 = torch.aten.mul.Tensor %2244, %2245 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_1544 = torch.constant.int 1
%2247 = torch.aten.add.Tensor %2240, %2246, %int1_1544 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%2248 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%2249 = torch.aten.mul.Tensor %2247, %2248 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%2250 = torch.aten.tanh %2249 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%2251 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_1545 = torch.constant.int 1
%2252 = torch.aten.add.Tensor %2250, %2251, %int1_1545 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%2253 = torch.aten.mul.Tensor %2242, %2252 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%2254 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1546 = torch.constant.int 7
%int6400_1547 = torch.constant.int 6400
%2255 = torch.prim.ListConstruct %int7_1546, %int6400_1547 : (!torch.int, !torch.int) -> !torch.list<int>
%2256 = torch.aten.reshape %2253, %2255 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_1548 = torch.constant.int 0
%int1_1549 = torch.constant.int 1
%2257 = torch.aten.mm %2256, %228 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%2258 = torch.aten.add.Tensor %2257, %229, %int1_1549 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%2259 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1550 = torch.constant.int 1
%int7_1551 = torch.constant.int 7
%int1600_1552 = torch.constant.int 1600
%2260 = torch.prim.ListConstruct %int1_1550, %int7_1551, %int1600_1552 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2261 = torch.aten.reshape %2258, %2260 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_1553 = torch.constant.int 1
%2262 = torch.aten.add.Tensor %2231, %2261, %int1_1553 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_1554 = torch.constant.float 9.9999997473787516E-6
%int1600_1555 = torch.constant.int 1600
%2263 = torch.prim.ListConstruct %int1600_1555 : (!torch.int) -> !torch.list<int>
%result0_1556, %result1_1557, %result2_1558 = torch.aten.native_layer_norm %2262, %2263, %230, %231, %float9.999990e-06_1554 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%2264 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1559 = torch.constant.int 7
%int1600_1560 = torch.constant.int 1600
%2265 = torch.prim.ListConstruct %int7_1559, %int1600_1560 : (!torch.int, !torch.int) -> !torch.list<int>
%2266 = torch.aten.reshape %result0_1556, %2265 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_1561 = torch.constant.int 0
%int1_1562 = torch.constant.int 1
%2267 = torch.aten.mm %2266, %232 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%2268 = torch.aten.add.Tensor %2267, %233, %int1_1562 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%2269 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1563 = torch.constant.int 1
%int7_1564 = torch.constant.int 7
%int4800_1565 = torch.constant.int 4800
%2270 = torch.prim.ListConstruct %int1_1563, %int7_1564, %int4800_1565 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2271 = torch.aten.reshape %2268, %2270 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%2272 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%2273 = torch.prim.tolist(%2272) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2_1566 = torch.constant.int 2
%2274 = torch.aten.split_with_sizes %2271, %2273, %int2_1566 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%2275:3 = torch.prim.ListUnpack %2274 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%2276 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_1567 = torch.constant.int 1
%int7_1568 = torch.constant.int 7
%int25_1569 = torch.constant.int 25
%int64_1570 = torch.constant.int 64
%2277 = torch.prim.ListConstruct %int1_1567, %int7_1568, %int25_1569, %int64_1570 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2278 = torch.aten.reshape %2275#0, %2277 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_1571 = torch.constant.int 1
%int2_1572 = torch.constant.int 2
%2279 = torch.aten.transpose.int %2278, %int1_1571, %int2_1572 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%2280 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_1573 = torch.constant.int 1
%int7_1574 = torch.constant.int 7
%int25_1575 = torch.constant.int 25
%int64_1576 = torch.constant.int 64
%2281 = torch.prim.ListConstruct %int1_1573, %int7_1574, %int25_1575, %int64_1576 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2282 = torch.aten.reshape %2275#1, %2281 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_1577 = torch.constant.int 1
%int2_1578 = torch.constant.int 2
%2283 = torch.aten.transpose.int %2282, %int1_1577, %int2_1578 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%2284 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_1579 = torch.constant.int 1
%int7_1580 = torch.constant.int 7
%int25_1581 = torch.constant.int 25
%int64_1582 = torch.constant.int 64
%2285 = torch.prim.ListConstruct %int1_1579, %int7_1580, %int25_1581, %int64_1582 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2286 = torch.aten.reshape %2275#2, %2285 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_1583 = torch.constant.int 1
%int2_1584 = torch.constant.int 2
%2287 = torch.aten.transpose.int %2286, %int1_1583, %int2_1584 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_1585 = torch.constant.int 1
%int2_1586 = torch.constant.int 2
%2288 = torch.aten.transpose.int %2282, %int1_1585, %int2_1586 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_1587 = torch.constant.int 2
%int3_1588 = torch.constant.int 3
%2289 = torch.aten.transpose.int %2288, %int2_1587, %int3_1588 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%2290 = torch.aten.matmul %2279, %2289 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%2291 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%2292 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%2293 = torch.aten.pow.Tensor_Tensor %2291, %2292 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%2294 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_1589 = torch.constant.int 0
%2295 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_1590 = torch.constant.none
%float0.000000e00_1591 = torch.constant.float 0.000000e+00
%2296 = torch.aten.full %2295, %float0.000000e00_1591, %none_1590, %none_1590, %none_1590, %none_1590 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_1592 = torch.constant.int 1
%2297 = torch.aten.add.Tensor %2296, %2293, %int1_1592 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%2298 = torch.aten.div.Tensor %2290, %2297 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%2299 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6_1593 = torch.constant.int 6
%none_1594 = torch.constant.none
%false_1595 = torch.constant.bool false
%2300 = torch.aten.to.dtype %2298, %int6_1593, %false_1595, %false_1595, %none_1594 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%2301 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%2302 = torch.aten.where.self %2299, %2300, %2301 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_1596 = torch.constant.int 3
%none_1597 = torch.constant.none
%2303 = torch.aten.softmax.int %2302, %int3_1596, %none_1597 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_1598 = torch.constant.int 6
%none_1599 = torch.constant.none
%false_1600 = torch.constant.bool false
%2304 = torch.aten.to.dtype %2303, %int6_1598, %false_1600, %false_1600, %none_1599 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%2305 = torch.aten.matmul %2304, %2287 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_1601 = torch.constant.int 1
%int2_1602 = torch.constant.int 2
%2306 = torch.aten.transpose.int %2305, %int1_1601, %int2_1602 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%2307 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1603 = torch.constant.int 1
%int7_1604 = torch.constant.int 7
%int1600_1605 = torch.constant.int 1600
%2308 = torch.prim.ListConstruct %int1_1603, %int7_1604, %int1600_1605 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2309 = torch.aten.reshape %2306, %2308 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%2310 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1606 = torch.constant.int 7
%int1600_1607 = torch.constant.int 1600
%2311 = torch.prim.ListConstruct %int7_1606, %int1600_1607 : (!torch.int, !torch.int) -> !torch.list<int>
%2312 = torch.aten.reshape %2309, %2311 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_1608 = torch.constant.int 0
%int1_1609 = torch.constant.int 1
%2313 = torch.aten.mm %2312, %234 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%2314 = torch.aten.add.Tensor %2313, %235, %int1_1609 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%2315 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1610 = torch.constant.int 1
%int7_1611 = torch.constant.int 7
%int1600_1612 = torch.constant.int 1600
%2316 = torch.prim.ListConstruct %int1_1610, %int7_1611, %int1600_1612 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2317 = torch.aten.reshape %2314, %2316 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_1613 = torch.constant.int 1
%2318 = torch.aten.add.Tensor %2317, %2262, %int1_1613 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_1614 = torch.constant.float 9.9999997473787516E-6
%int1600_1615 = torch.constant.int 1600
%2319 = torch.prim.ListConstruct %int1600_1615 : (!torch.int) -> !torch.list<int>
%result0_1616, %result1_1617, %result2_1618 = torch.aten.native_layer_norm %2318, %2319, %236, %237, %float9.999990e-06_1614 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%2320 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1619 = torch.constant.int 7
%int1600_1620 = torch.constant.int 1600
%2321 = torch.prim.ListConstruct %int7_1619, %int1600_1620 : (!torch.int, !torch.int) -> !torch.list<int>
%2322 = torch.aten.reshape %result0_1616, %2321 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_1621 = torch.constant.int 0
%int1_1622 = torch.constant.int 1
%2323 = torch.aten.mm %2322, %238 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%2324 = torch.aten.add.Tensor %2323, %239, %int1_1622 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%2325 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1623 = torch.constant.int 1
%int7_1624 = torch.constant.int 7
%int6400_1625 = torch.constant.int 6400
%2326 = torch.prim.ListConstruct %int1_1623, %int7_1624, %int6400_1625 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2327 = torch.aten.reshape %2324, %2326 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%2328 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%2329 = torch.aten.mul.Tensor %2327, %2328 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%2330 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%2331 = torch.aten.pow.Tensor_Tensor %2327, %2330 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%2332 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%2333 = torch.aten.mul.Tensor %2331, %2332 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_1626 = torch.constant.int 1
%2334 = torch.aten.add.Tensor %2327, %2333, %int1_1626 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%2335 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%2336 = torch.aten.mul.Tensor %2334, %2335 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%2337 = torch.aten.tanh %2336 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%2338 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_1627 = torch.constant.int 1
%2339 = torch.aten.add.Tensor %2337, %2338, %int1_1627 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%2340 = torch.aten.mul.Tensor %2329, %2339 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%2341 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1628 = torch.constant.int 7
%int6400_1629 = torch.constant.int 6400
%2342 = torch.prim.ListConstruct %int7_1628, %int6400_1629 : (!torch.int, !torch.int) -> !torch.list<int>
%2343 = torch.aten.reshape %2340, %2342 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_1630 = torch.constant.int 0
%int1_1631 = torch.constant.int 1
%2344 = torch.aten.mm %2343, %240 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%2345 = torch.aten.add.Tensor %2344, %241, %int1_1631 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%2346 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1632 = torch.constant.int 1
%int7_1633 = torch.constant.int 7
%int1600_1634 = torch.constant.int 1600
%2347 = torch.prim.ListConstruct %int1_1632, %int7_1633, %int1600_1634 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2348 = torch.aten.reshape %2345, %2347 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_1635 = torch.constant.int 1
%2349 = torch.aten.add.Tensor %2318, %2348, %int1_1635 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_1636 = torch.constant.float 9.9999997473787516E-6
%int1600_1637 = torch.constant.int 1600
%2350 = torch.prim.ListConstruct %int1600_1637 : (!torch.int) -> !torch.list<int>
%result0_1638, %result1_1639, %result2_1640 = torch.aten.native_layer_norm %2349, %2350, %242, %243, %float9.999990e-06_1636 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%2351 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1641 = torch.constant.int 7
%int1600_1642 = torch.constant.int 1600
%2352 = torch.prim.ListConstruct %int7_1641, %int1600_1642 : (!torch.int, !torch.int) -> !torch.list<int>
%2353 = torch.aten.reshape %result0_1638, %2352 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_1643 = torch.constant.int 0
%int1_1644 = torch.constant.int 1
%2354 = torch.aten.mm %2353, %244 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%2355 = torch.aten.add.Tensor %2354, %245, %int1_1644 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%2356 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1645 = torch.constant.int 1
%int7_1646 = torch.constant.int 7
%int4800_1647 = torch.constant.int 4800
%2357 = torch.prim.ListConstruct %int1_1645, %int7_1646, %int4800_1647 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2358 = torch.aten.reshape %2355, %2357 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%2359 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%2360 = torch.prim.tolist(%2359) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2_1648 = torch.constant.int 2
%2361 = torch.aten.split_with_sizes %2358, %2360, %int2_1648 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%2362:3 = torch.prim.ListUnpack %2361 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%2363 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_1649 = torch.constant.int 1
%int7_1650 = torch.constant.int 7
%int25_1651 = torch.constant.int 25
%int64_1652 = torch.constant.int 64
%2364 = torch.prim.ListConstruct %int1_1649, %int7_1650, %int25_1651, %int64_1652 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2365 = torch.aten.reshape %2362#0, %2364 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_1653 = torch.constant.int 1
%int2_1654 = torch.constant.int 2
%2366 = torch.aten.transpose.int %2365, %int1_1653, %int2_1654 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%2367 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_1655 = torch.constant.int 1
%int7_1656 = torch.constant.int 7
%int25_1657 = torch.constant.int 25
%int64_1658 = torch.constant.int 64
%2368 = torch.prim.ListConstruct %int1_1655, %int7_1656, %int25_1657, %int64_1658 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2369 = torch.aten.reshape %2362#1, %2368 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_1659 = torch.constant.int 1
%int2_1660 = torch.constant.int 2
%2370 = torch.aten.transpose.int %2369, %int1_1659, %int2_1660 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%2371 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_1661 = torch.constant.int 1
%int7_1662 = torch.constant.int 7
%int25_1663 = torch.constant.int 25
%int64_1664 = torch.constant.int 64
%2372 = torch.prim.ListConstruct %int1_1661, %int7_1662, %int25_1663, %int64_1664 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2373 = torch.aten.reshape %2362#2, %2372 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_1665 = torch.constant.int 1
%int2_1666 = torch.constant.int 2
%2374 = torch.aten.transpose.int %2373, %int1_1665, %int2_1666 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_1667 = torch.constant.int 1
%int2_1668 = torch.constant.int 2
%2375 = torch.aten.transpose.int %2369, %int1_1667, %int2_1668 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_1669 = torch.constant.int 2
%int3_1670 = torch.constant.int 3
%2376 = torch.aten.transpose.int %2375, %int2_1669, %int3_1670 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%2377 = torch.aten.matmul %2366, %2376 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%2378 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%2379 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%2380 = torch.aten.pow.Tensor_Tensor %2378, %2379 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%2381 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_1671 = torch.constant.int 0
%2382 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_1672 = torch.constant.none
%float0.000000e00_1673 = torch.constant.float 0.000000e+00
%2383 = torch.aten.full %2382, %float0.000000e00_1673, %none_1672, %none_1672, %none_1672, %none_1672 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_1674 = torch.constant.int 1
%2384 = torch.aten.add.Tensor %2383, %2380, %int1_1674 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%2385 = torch.aten.div.Tensor %2377, %2384 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%2386 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6_1675 = torch.constant.int 6
%none_1676 = torch.constant.none
%false_1677 = torch.constant.bool false
%2387 = torch.aten.to.dtype %2385, %int6_1675, %false_1677, %false_1677, %none_1676 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%2388 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%2389 = torch.aten.where.self %2386, %2387, %2388 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_1678 = torch.constant.int 3
%none_1679 = torch.constant.none
%2390 = torch.aten.softmax.int %2389, %int3_1678, %none_1679 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_1680 = torch.constant.int 6
%none_1681 = torch.constant.none
%false_1682 = torch.constant.bool false
%2391 = torch.aten.to.dtype %2390, %int6_1680, %false_1682, %false_1682, %none_1681 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%2392 = torch.aten.matmul %2391, %2374 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_1683 = torch.constant.int 1
%int2_1684 = torch.constant.int 2
%2393 = torch.aten.transpose.int %2392, %int1_1683, %int2_1684 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%2394 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1685 = torch.constant.int 1
%int7_1686 = torch.constant.int 7
%int1600_1687 = torch.constant.int 1600
%2395 = torch.prim.ListConstruct %int1_1685, %int7_1686, %int1600_1687 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2396 = torch.aten.reshape %2393, %2395 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%2397 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1688 = torch.constant.int 7
%int1600_1689 = torch.constant.int 1600
%2398 = torch.prim.ListConstruct %int7_1688, %int1600_1689 : (!torch.int, !torch.int) -> !torch.list<int>
%2399 = torch.aten.reshape %2396, %2398 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_1690 = torch.constant.int 0
%int1_1691 = torch.constant.int 1
%2400 = torch.aten.mm %2399, %246 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%2401 = torch.aten.add.Tensor %2400, %247, %int1_1691 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%2402 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1692 = torch.constant.int 1
%int7_1693 = torch.constant.int 7
%int1600_1694 = torch.constant.int 1600
%2403 = torch.prim.ListConstruct %int1_1692, %int7_1693, %int1600_1694 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2404 = torch.aten.reshape %2401, %2403 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_1695 = torch.constant.int 1
%2405 = torch.aten.add.Tensor %2404, %2349, %int1_1695 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_1696 = torch.constant.float 9.9999997473787516E-6
%int1600_1697 = torch.constant.int 1600
%2406 = torch.prim.ListConstruct %int1600_1697 : (!torch.int) -> !torch.list<int>
%result0_1698, %result1_1699, %result2_1700 = torch.aten.native_layer_norm %2405, %2406, %248, %249, %float9.999990e-06_1696 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%2407 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1701 = torch.constant.int 7
%int1600_1702 = torch.constant.int 1600
%2408 = torch.prim.ListConstruct %int7_1701, %int1600_1702 : (!torch.int, !torch.int) -> !torch.list<int>
%2409 = torch.aten.reshape %result0_1698, %2408 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_1703 = torch.constant.int 0
%int1_1704 = torch.constant.int 1
%2410 = torch.aten.mm %2409, %250 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%2411 = torch.aten.add.Tensor %2410, %251, %int1_1704 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%2412 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1705 = torch.constant.int 1
%int7_1706 = torch.constant.int 7
%int6400_1707 = torch.constant.int 6400
%2413 = torch.prim.ListConstruct %int1_1705, %int7_1706, %int6400_1707 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2414 = torch.aten.reshape %2411, %2413 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%2415 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%2416 = torch.aten.mul.Tensor %2414, %2415 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%2417 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%2418 = torch.aten.pow.Tensor_Tensor %2414, %2417 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%2419 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%2420 = torch.aten.mul.Tensor %2418, %2419 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_1708 = torch.constant.int 1
%2421 = torch.aten.add.Tensor %2414, %2420, %int1_1708 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%2422 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%2423 = torch.aten.mul.Tensor %2421, %2422 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%2424 = torch.aten.tanh %2423 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%2425 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_1709 = torch.constant.int 1
%2426 = torch.aten.add.Tensor %2424, %2425, %int1_1709 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%2427 = torch.aten.mul.Tensor %2416, %2426 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%2428 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1710 = torch.constant.int 7
%int6400_1711 = torch.constant.int 6400
%2429 = torch.prim.ListConstruct %int7_1710, %int6400_1711 : (!torch.int, !torch.int) -> !torch.list<int>
%2430 = torch.aten.reshape %2427, %2429 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_1712 = torch.constant.int 0
%int1_1713 = torch.constant.int 1
%2431 = torch.aten.mm %2430, %252 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%2432 = torch.aten.add.Tensor %2431, %253, %int1_1713 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%2433 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1714 = torch.constant.int 1
%int7_1715 = torch.constant.int 7
%int1600_1716 = torch.constant.int 1600
%2434 = torch.prim.ListConstruct %int1_1714, %int7_1715, %int1600_1716 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2435 = torch.aten.reshape %2432, %2434 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_1717 = torch.constant.int 1
%2436 = torch.aten.add.Tensor %2405, %2435, %int1_1717 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_1718 = torch.constant.float 9.9999997473787516E-6
%int1600_1719 = torch.constant.int 1600
%2437 = torch.prim.ListConstruct %int1600_1719 : (!torch.int) -> !torch.list<int>
%result0_1720, %result1_1721, %result2_1722 = torch.aten.native_layer_norm %2436, %2437, %254, %255, %float9.999990e-06_1718 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%2438 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1723 = torch.constant.int 7
%int1600_1724 = torch.constant.int 1600
%2439 = torch.prim.ListConstruct %int7_1723, %int1600_1724 : (!torch.int, !torch.int) -> !torch.list<int>
%2440 = torch.aten.reshape %result0_1720, %2439 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_1725 = torch.constant.int 0
%int1_1726 = torch.constant.int 1
%2441 = torch.aten.mm %2440, %256 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%2442 = torch.aten.add.Tensor %2441, %257, %int1_1726 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%2443 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1727 = torch.constant.int 1
%int7_1728 = torch.constant.int 7
%int4800_1729 = torch.constant.int 4800
%2444 = torch.prim.ListConstruct %int1_1727, %int7_1728, %int4800_1729 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2445 = torch.aten.reshape %2442, %2444 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%2446 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%2447 = torch.prim.tolist(%2446) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2_1730 = torch.constant.int 2
%2448 = torch.aten.split_with_sizes %2445, %2447, %int2_1730 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%2449:3 = torch.prim.ListUnpack %2448 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%2450 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_1731 = torch.constant.int 1
%int7_1732 = torch.constant.int 7
%int25_1733 = torch.constant.int 25
%int64_1734 = torch.constant.int 64
%2451 = torch.prim.ListConstruct %int1_1731, %int7_1732, %int25_1733, %int64_1734 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2452 = torch.aten.reshape %2449#0, %2451 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_1735 = torch.constant.int 1
%int2_1736 = torch.constant.int 2
%2453 = torch.aten.transpose.int %2452, %int1_1735, %int2_1736 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%2454 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_1737 = torch.constant.int 1
%int7_1738 = torch.constant.int 7
%int25_1739 = torch.constant.int 25
%int64_1740 = torch.constant.int 64
%2455 = torch.prim.ListConstruct %int1_1737, %int7_1738, %int25_1739, %int64_1740 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2456 = torch.aten.reshape %2449#1, %2455 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_1741 = torch.constant.int 1
%int2_1742 = torch.constant.int 2
%2457 = torch.aten.transpose.int %2456, %int1_1741, %int2_1742 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%2458 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_1743 = torch.constant.int 1
%int7_1744 = torch.constant.int 7
%int25_1745 = torch.constant.int 25
%int64_1746 = torch.constant.int 64
%2459 = torch.prim.ListConstruct %int1_1743, %int7_1744, %int25_1745, %int64_1746 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2460 = torch.aten.reshape %2449#2, %2459 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_1747 = torch.constant.int 1
%int2_1748 = torch.constant.int 2
%2461 = torch.aten.transpose.int %2460, %int1_1747, %int2_1748 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_1749 = torch.constant.int 1
%int2_1750 = torch.constant.int 2
%2462 = torch.aten.transpose.int %2456, %int1_1749, %int2_1750 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_1751 = torch.constant.int 2
%int3_1752 = torch.constant.int 3
%2463 = torch.aten.transpose.int %2462, %int2_1751, %int3_1752 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%2464 = torch.aten.matmul %2453, %2463 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%2465 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%2466 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%2467 = torch.aten.pow.Tensor_Tensor %2465, %2466 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%2468 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_1753 = torch.constant.int 0
%2469 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_1754 = torch.constant.none
%float0.000000e00_1755 = torch.constant.float 0.000000e+00
%2470 = torch.aten.full %2469, %float0.000000e00_1755, %none_1754, %none_1754, %none_1754, %none_1754 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_1756 = torch.constant.int 1
%2471 = torch.aten.add.Tensor %2470, %2467, %int1_1756 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%2472 = torch.aten.div.Tensor %2464, %2471 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%2473 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6_1757 = torch.constant.int 6
%none_1758 = torch.constant.none
%false_1759 = torch.constant.bool false
%2474 = torch.aten.to.dtype %2472, %int6_1757, %false_1759, %false_1759, %none_1758 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%2475 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%2476 = torch.aten.where.self %2473, %2474, %2475 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_1760 = torch.constant.int 3
%none_1761 = torch.constant.none
%2477 = torch.aten.softmax.int %2476, %int3_1760, %none_1761 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_1762 = torch.constant.int 6
%none_1763 = torch.constant.none
%false_1764 = torch.constant.bool false
%2478 = torch.aten.to.dtype %2477, %int6_1762, %false_1764, %false_1764, %none_1763 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%2479 = torch.aten.matmul %2478, %2461 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_1765 = torch.constant.int 1
%int2_1766 = torch.constant.int 2
%2480 = torch.aten.transpose.int %2479, %int1_1765, %int2_1766 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%2481 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1767 = torch.constant.int 1
%int7_1768 = torch.constant.int 7
%int1600_1769 = torch.constant.int 1600
%2482 = torch.prim.ListConstruct %int1_1767, %int7_1768, %int1600_1769 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2483 = torch.aten.reshape %2480, %2482 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%2484 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1770 = torch.constant.int 7
%int1600_1771 = torch.constant.int 1600
%2485 = torch.prim.ListConstruct %int7_1770, %int1600_1771 : (!torch.int, !torch.int) -> !torch.list<int>
%2486 = torch.aten.reshape %2483, %2485 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_1772 = torch.constant.int 0
%int1_1773 = torch.constant.int 1
%2487 = torch.aten.mm %2486, %258 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%2488 = torch.aten.add.Tensor %2487, %259, %int1_1773 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%2489 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1774 = torch.constant.int 1
%int7_1775 = torch.constant.int 7
%int1600_1776 = torch.constant.int 1600
%2490 = torch.prim.ListConstruct %int1_1774, %int7_1775, %int1600_1776 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2491 = torch.aten.reshape %2488, %2490 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_1777 = torch.constant.int 1
%2492 = torch.aten.add.Tensor %2491, %2436, %int1_1777 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_1778 = torch.constant.float 9.9999997473787516E-6
%int1600_1779 = torch.constant.int 1600
%2493 = torch.prim.ListConstruct %int1600_1779 : (!torch.int) -> !torch.list<int>
%result0_1780, %result1_1781, %result2_1782 = torch.aten.native_layer_norm %2492, %2493, %260, %261, %float9.999990e-06_1778 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%2494 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1783 = torch.constant.int 7
%int1600_1784 = torch.constant.int 1600
%2495 = torch.prim.ListConstruct %int7_1783, %int1600_1784 : (!torch.int, !torch.int) -> !torch.list<int>
%2496 = torch.aten.reshape %result0_1780, %2495 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_1785 = torch.constant.int 0
%int1_1786 = torch.constant.int 1
%2497 = torch.aten.mm %2496, %262 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%2498 = torch.aten.add.Tensor %2497, %263, %int1_1786 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%2499 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1787 = torch.constant.int 1
%int7_1788 = torch.constant.int 7
%int6400_1789 = torch.constant.int 6400
%2500 = torch.prim.ListConstruct %int1_1787, %int7_1788, %int6400_1789 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2501 = torch.aten.reshape %2498, %2500 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%2502 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%2503 = torch.aten.mul.Tensor %2501, %2502 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%2504 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%2505 = torch.aten.pow.Tensor_Tensor %2501, %2504 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%2506 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%2507 = torch.aten.mul.Tensor %2505, %2506 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_1790 = torch.constant.int 1
%2508 = torch.aten.add.Tensor %2501, %2507, %int1_1790 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%2509 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%2510 = torch.aten.mul.Tensor %2508, %2509 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%2511 = torch.aten.tanh %2510 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%2512 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_1791 = torch.constant.int 1
%2513 = torch.aten.add.Tensor %2511, %2512, %int1_1791 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%2514 = torch.aten.mul.Tensor %2503, %2513 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%2515 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1792 = torch.constant.int 7
%int6400_1793 = torch.constant.int 6400
%2516 = torch.prim.ListConstruct %int7_1792, %int6400_1793 : (!torch.int, !torch.int) -> !torch.list<int>
%2517 = torch.aten.reshape %2514, %2516 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_1794 = torch.constant.int 0
%int1_1795 = torch.constant.int 1
%2518 = torch.aten.mm %2517, %264 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%2519 = torch.aten.add.Tensor %2518, %265, %int1_1795 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%2520 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1796 = torch.constant.int 1
%int7_1797 = torch.constant.int 7
%int1600_1798 = torch.constant.int 1600
%2521 = torch.prim.ListConstruct %int1_1796, %int7_1797, %int1600_1798 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2522 = torch.aten.reshape %2519, %2521 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_1799 = torch.constant.int 1
%2523 = torch.aten.add.Tensor %2492, %2522, %int1_1799 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_1800 = torch.constant.float 9.9999997473787516E-6
%int1600_1801 = torch.constant.int 1600
%2524 = torch.prim.ListConstruct %int1600_1801 : (!torch.int) -> !torch.list<int>
%result0_1802, %result1_1803, %result2_1804 = torch.aten.native_layer_norm %2523, %2524, %266, %267, %float9.999990e-06_1800 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%2525 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1805 = torch.constant.int 7
%int1600_1806 = torch.constant.int 1600
%2526 = torch.prim.ListConstruct %int7_1805, %int1600_1806 : (!torch.int, !torch.int) -> !torch.list<int>
%2527 = torch.aten.reshape %result0_1802, %2526 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_1807 = torch.constant.int 0
%int1_1808 = torch.constant.int 1
%2528 = torch.aten.mm %2527, %268 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%2529 = torch.aten.add.Tensor %2528, %269, %int1_1808 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%2530 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1809 = torch.constant.int 1
%int7_1810 = torch.constant.int 7
%int4800_1811 = torch.constant.int 4800
%2531 = torch.prim.ListConstruct %int1_1809, %int7_1810, %int4800_1811 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2532 = torch.aten.reshape %2529, %2531 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%2533 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%2534 = torch.prim.tolist(%2533) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2_1812 = torch.constant.int 2
%2535 = torch.aten.split_with_sizes %2532, %2534, %int2_1812 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%2536:3 = torch.prim.ListUnpack %2535 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%2537 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_1813 = torch.constant.int 1
%int7_1814 = torch.constant.int 7
%int25_1815 = torch.constant.int 25
%int64_1816 = torch.constant.int 64
%2538 = torch.prim.ListConstruct %int1_1813, %int7_1814, %int25_1815, %int64_1816 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2539 = torch.aten.reshape %2536#0, %2538 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_1817 = torch.constant.int 1
%int2_1818 = torch.constant.int 2
%2540 = torch.aten.transpose.int %2539, %int1_1817, %int2_1818 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%2541 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_1819 = torch.constant.int 1
%int7_1820 = torch.constant.int 7
%int25_1821 = torch.constant.int 25
%int64_1822 = torch.constant.int 64
%2542 = torch.prim.ListConstruct %int1_1819, %int7_1820, %int25_1821, %int64_1822 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2543 = torch.aten.reshape %2536#1, %2542 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_1823 = torch.constant.int 1
%int2_1824 = torch.constant.int 2
%2544 = torch.aten.transpose.int %2543, %int1_1823, %int2_1824 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%2545 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_1825 = torch.constant.int 1
%int7_1826 = torch.constant.int 7
%int25_1827 = torch.constant.int 25
%int64_1828 = torch.constant.int 64
%2546 = torch.prim.ListConstruct %int1_1825, %int7_1826, %int25_1827, %int64_1828 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2547 = torch.aten.reshape %2536#2, %2546 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_1829 = torch.constant.int 1
%int2_1830 = torch.constant.int 2
%2548 = torch.aten.transpose.int %2547, %int1_1829, %int2_1830 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_1831 = torch.constant.int 1
%int2_1832 = torch.constant.int 2
%2549 = torch.aten.transpose.int %2543, %int1_1831, %int2_1832 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_1833 = torch.constant.int 2
%int3_1834 = torch.constant.int 3
%2550 = torch.aten.transpose.int %2549, %int2_1833, %int3_1834 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%2551 = torch.aten.matmul %2540, %2550 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%2552 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%2553 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%2554 = torch.aten.pow.Tensor_Tensor %2552, %2553 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%2555 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_1835 = torch.constant.int 0
%2556 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_1836 = torch.constant.none
%float0.000000e00_1837 = torch.constant.float 0.000000e+00
%2557 = torch.aten.full %2556, %float0.000000e00_1837, %none_1836, %none_1836, %none_1836, %none_1836 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_1838 = torch.constant.int 1
%2558 = torch.aten.add.Tensor %2557, %2554, %int1_1838 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%2559 = torch.aten.div.Tensor %2551, %2558 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%2560 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6_1839 = torch.constant.int 6
%none_1840 = torch.constant.none
%false_1841 = torch.constant.bool false
%2561 = torch.aten.to.dtype %2559, %int6_1839, %false_1841, %false_1841, %none_1840 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%2562 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%2563 = torch.aten.where.self %2560, %2561, %2562 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_1842 = torch.constant.int 3
%none_1843 = torch.constant.none
%2564 = torch.aten.softmax.int %2563, %int3_1842, %none_1843 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_1844 = torch.constant.int 6
%none_1845 = torch.constant.none
%false_1846 = torch.constant.bool false
%2565 = torch.aten.to.dtype %2564, %int6_1844, %false_1846, %false_1846, %none_1845 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%2566 = torch.aten.matmul %2565, %2548 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_1847 = torch.constant.int 1
%int2_1848 = torch.constant.int 2
%2567 = torch.aten.transpose.int %2566, %int1_1847, %int2_1848 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%2568 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1849 = torch.constant.int 1
%int7_1850 = torch.constant.int 7
%int1600_1851 = torch.constant.int 1600
%2569 = torch.prim.ListConstruct %int1_1849, %int7_1850, %int1600_1851 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2570 = torch.aten.reshape %2567, %2569 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%2571 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1852 = torch.constant.int 7
%int1600_1853 = torch.constant.int 1600
%2572 = torch.prim.ListConstruct %int7_1852, %int1600_1853 : (!torch.int, !torch.int) -> !torch.list<int>
%2573 = torch.aten.reshape %2570, %2572 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_1854 = torch.constant.int 0
%int1_1855 = torch.constant.int 1
%2574 = torch.aten.mm %2573, %270 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%2575 = torch.aten.add.Tensor %2574, %271, %int1_1855 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%2576 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1856 = torch.constant.int 1
%int7_1857 = torch.constant.int 7
%int1600_1858 = torch.constant.int 1600
%2577 = torch.prim.ListConstruct %int1_1856, %int7_1857, %int1600_1858 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2578 = torch.aten.reshape %2575, %2577 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_1859 = torch.constant.int 1
%2579 = torch.aten.add.Tensor %2578, %2523, %int1_1859 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_1860 = torch.constant.float 9.9999997473787516E-6
%int1600_1861 = torch.constant.int 1600
%2580 = torch.prim.ListConstruct %int1600_1861 : (!torch.int) -> !torch.list<int>
%result0_1862, %result1_1863, %result2_1864 = torch.aten.native_layer_norm %2579, %2580, %272, %273, %float9.999990e-06_1860 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%2581 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1865 = torch.constant.int 7
%int1600_1866 = torch.constant.int 1600
%2582 = torch.prim.ListConstruct %int7_1865, %int1600_1866 : (!torch.int, !torch.int) -> !torch.list<int>
%2583 = torch.aten.reshape %result0_1862, %2582 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_1867 = torch.constant.int 0
%int1_1868 = torch.constant.int 1
%2584 = torch.aten.mm %2583, %274 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%2585 = torch.aten.add.Tensor %2584, %275, %int1_1868 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%2586 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1869 = torch.constant.int 1
%int7_1870 = torch.constant.int 7
%int6400_1871 = torch.constant.int 6400
%2587 = torch.prim.ListConstruct %int1_1869, %int7_1870, %int6400_1871 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2588 = torch.aten.reshape %2585, %2587 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%2589 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%2590 = torch.aten.mul.Tensor %2588, %2589 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%2591 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%2592 = torch.aten.pow.Tensor_Tensor %2588, %2591 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%2593 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%2594 = torch.aten.mul.Tensor %2592, %2593 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_1872 = torch.constant.int 1
%2595 = torch.aten.add.Tensor %2588, %2594, %int1_1872 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%2596 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%2597 = torch.aten.mul.Tensor %2595, %2596 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%2598 = torch.aten.tanh %2597 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%2599 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_1873 = torch.constant.int 1
%2600 = torch.aten.add.Tensor %2598, %2599, %int1_1873 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%2601 = torch.aten.mul.Tensor %2590, %2600 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%2602 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1874 = torch.constant.int 7
%int6400_1875 = torch.constant.int 6400
%2603 = torch.prim.ListConstruct %int7_1874, %int6400_1875 : (!torch.int, !torch.int) -> !torch.list<int>
%2604 = torch.aten.reshape %2601, %2603 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_1876 = torch.constant.int 0
%int1_1877 = torch.constant.int 1
%2605 = torch.aten.mm %2604, %276 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%2606 = torch.aten.add.Tensor %2605, %277, %int1_1877 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%2607 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1878 = torch.constant.int 1
%int7_1879 = torch.constant.int 7
%int1600_1880 = torch.constant.int 1600
%2608 = torch.prim.ListConstruct %int1_1878, %int7_1879, %int1600_1880 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2609 = torch.aten.reshape %2606, %2608 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_1881 = torch.constant.int 1
%2610 = torch.aten.add.Tensor %2579, %2609, %int1_1881 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_1882 = torch.constant.float 9.9999997473787516E-6
%int1600_1883 = torch.constant.int 1600
%2611 = torch.prim.ListConstruct %int1600_1883 : (!torch.int) -> !torch.list<int>
%result0_1884, %result1_1885, %result2_1886 = torch.aten.native_layer_norm %2610, %2611, %278, %279, %float9.999990e-06_1882 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%2612 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1887 = torch.constant.int 7
%int1600_1888 = torch.constant.int 1600
%2613 = torch.prim.ListConstruct %int7_1887, %int1600_1888 : (!torch.int, !torch.int) -> !torch.list<int>
%2614 = torch.aten.reshape %result0_1884, %2613 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_1889 = torch.constant.int 0
%int1_1890 = torch.constant.int 1
%2615 = torch.aten.mm %2614, %280 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%2616 = torch.aten.add.Tensor %2615, %281, %int1_1890 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%2617 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1891 = torch.constant.int 1
%int7_1892 = torch.constant.int 7
%int4800_1893 = torch.constant.int 4800
%2618 = torch.prim.ListConstruct %int1_1891, %int7_1892, %int4800_1893 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2619 = torch.aten.reshape %2616, %2618 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%2620 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%2621 = torch.prim.tolist(%2620) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2_1894 = torch.constant.int 2
%2622 = torch.aten.split_with_sizes %2619, %2621, %int2_1894 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%2623:3 = torch.prim.ListUnpack %2622 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%2624 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_1895 = torch.constant.int 1
%int7_1896 = torch.constant.int 7
%int25_1897 = torch.constant.int 25
%int64_1898 = torch.constant.int 64
%2625 = torch.prim.ListConstruct %int1_1895, %int7_1896, %int25_1897, %int64_1898 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2626 = torch.aten.reshape %2623#0, %2625 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_1899 = torch.constant.int 1
%int2_1900 = torch.constant.int 2
%2627 = torch.aten.transpose.int %2626, %int1_1899, %int2_1900 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%2628 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_1901 = torch.constant.int 1
%int7_1902 = torch.constant.int 7
%int25_1903 = torch.constant.int 25
%int64_1904 = torch.constant.int 64
%2629 = torch.prim.ListConstruct %int1_1901, %int7_1902, %int25_1903, %int64_1904 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2630 = torch.aten.reshape %2623#1, %2629 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_1905 = torch.constant.int 1
%int2_1906 = torch.constant.int 2
%2631 = torch.aten.transpose.int %2630, %int1_1905, %int2_1906 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%2632 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_1907 = torch.constant.int 1
%int7_1908 = torch.constant.int 7
%int25_1909 = torch.constant.int 25
%int64_1910 = torch.constant.int 64
%2633 = torch.prim.ListConstruct %int1_1907, %int7_1908, %int25_1909, %int64_1910 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2634 = torch.aten.reshape %2623#2, %2633 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_1911 = torch.constant.int 1
%int2_1912 = torch.constant.int 2
%2635 = torch.aten.transpose.int %2634, %int1_1911, %int2_1912 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_1913 = torch.constant.int 1
%int2_1914 = torch.constant.int 2
%2636 = torch.aten.transpose.int %2630, %int1_1913, %int2_1914 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_1915 = torch.constant.int 2
%int3_1916 = torch.constant.int 3
%2637 = torch.aten.transpose.int %2636, %int2_1915, %int3_1916 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%2638 = torch.aten.matmul %2627, %2637 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%2639 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%2640 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%2641 = torch.aten.pow.Tensor_Tensor %2639, %2640 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%2642 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_1917 = torch.constant.int 0
%2643 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_1918 = torch.constant.none
%float0.000000e00_1919 = torch.constant.float 0.000000e+00
%2644 = torch.aten.full %2643, %float0.000000e00_1919, %none_1918, %none_1918, %none_1918, %none_1918 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_1920 = torch.constant.int 1
%2645 = torch.aten.add.Tensor %2644, %2641, %int1_1920 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%2646 = torch.aten.div.Tensor %2638, %2645 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%2647 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6_1921 = torch.constant.int 6
%none_1922 = torch.constant.none
%false_1923 = torch.constant.bool false
%2648 = torch.aten.to.dtype %2646, %int6_1921, %false_1923, %false_1923, %none_1922 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%2649 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%2650 = torch.aten.where.self %2647, %2648, %2649 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_1924 = torch.constant.int 3
%none_1925 = torch.constant.none
%2651 = torch.aten.softmax.int %2650, %int3_1924, %none_1925 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_1926 = torch.constant.int 6
%none_1927 = torch.constant.none
%false_1928 = torch.constant.bool false
%2652 = torch.aten.to.dtype %2651, %int6_1926, %false_1928, %false_1928, %none_1927 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%2653 = torch.aten.matmul %2652, %2635 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_1929 = torch.constant.int 1
%int2_1930 = torch.constant.int 2
%2654 = torch.aten.transpose.int %2653, %int1_1929, %int2_1930 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%2655 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1931 = torch.constant.int 1
%int7_1932 = torch.constant.int 7
%int1600_1933 = torch.constant.int 1600
%2656 = torch.prim.ListConstruct %int1_1931, %int7_1932, %int1600_1933 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2657 = torch.aten.reshape %2654, %2656 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%2658 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1934 = torch.constant.int 7
%int1600_1935 = torch.constant.int 1600
%2659 = torch.prim.ListConstruct %int7_1934, %int1600_1935 : (!torch.int, !torch.int) -> !torch.list<int>
%2660 = torch.aten.reshape %2657, %2659 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_1936 = torch.constant.int 0
%int1_1937 = torch.constant.int 1
%2661 = torch.aten.mm %2660, %282 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%2662 = torch.aten.add.Tensor %2661, %283, %int1_1937 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%2663 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1938 = torch.constant.int 1
%int7_1939 = torch.constant.int 7
%int1600_1940 = torch.constant.int 1600
%2664 = torch.prim.ListConstruct %int1_1938, %int7_1939, %int1600_1940 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2665 = torch.aten.reshape %2662, %2664 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_1941 = torch.constant.int 1
%2666 = torch.aten.add.Tensor %2665, %2610, %int1_1941 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_1942 = torch.constant.float 9.9999997473787516E-6
%int1600_1943 = torch.constant.int 1600
%2667 = torch.prim.ListConstruct %int1600_1943 : (!torch.int) -> !torch.list<int>
%result0_1944, %result1_1945, %result2_1946 = torch.aten.native_layer_norm %2666, %2667, %284, %285, %float9.999990e-06_1942 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%2668 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1947 = torch.constant.int 7
%int1600_1948 = torch.constant.int 1600
%2669 = torch.prim.ListConstruct %int7_1947, %int1600_1948 : (!torch.int, !torch.int) -> !torch.list<int>
%2670 = torch.aten.reshape %result0_1944, %2669 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_1949 = torch.constant.int 0
%int1_1950 = torch.constant.int 1
%2671 = torch.aten.mm %2670, %286 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%2672 = torch.aten.add.Tensor %2671, %287, %int1_1950 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%2673 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1951 = torch.constant.int 1
%int7_1952 = torch.constant.int 7
%int6400_1953 = torch.constant.int 6400
%2674 = torch.prim.ListConstruct %int1_1951, %int7_1952, %int6400_1953 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2675 = torch.aten.reshape %2672, %2674 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%2676 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%2677 = torch.aten.mul.Tensor %2675, %2676 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%2678 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%2679 = torch.aten.pow.Tensor_Tensor %2675, %2678 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%2680 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%2681 = torch.aten.mul.Tensor %2679, %2680 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_1954 = torch.constant.int 1
%2682 = torch.aten.add.Tensor %2675, %2681, %int1_1954 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%2683 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%2684 = torch.aten.mul.Tensor %2682, %2683 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%2685 = torch.aten.tanh %2684 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%2686 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_1955 = torch.constant.int 1
%2687 = torch.aten.add.Tensor %2685, %2686, %int1_1955 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%2688 = torch.aten.mul.Tensor %2677, %2687 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%2689 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1956 = torch.constant.int 7
%int6400_1957 = torch.constant.int 6400
%2690 = torch.prim.ListConstruct %int7_1956, %int6400_1957 : (!torch.int, !torch.int) -> !torch.list<int>
%2691 = torch.aten.reshape %2688, %2690 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_1958 = torch.constant.int 0
%int1_1959 = torch.constant.int 1
%2692 = torch.aten.mm %2691, %288 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%2693 = torch.aten.add.Tensor %2692, %289, %int1_1959 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%2694 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1960 = torch.constant.int 1
%int7_1961 = torch.constant.int 7
%int1600_1962 = torch.constant.int 1600
%2695 = torch.prim.ListConstruct %int1_1960, %int7_1961, %int1600_1962 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2696 = torch.aten.reshape %2693, %2695 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_1963 = torch.constant.int 1
%2697 = torch.aten.add.Tensor %2666, %2696, %int1_1963 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_1964 = torch.constant.float 9.9999997473787516E-6
%int1600_1965 = torch.constant.int 1600
%2698 = torch.prim.ListConstruct %int1600_1965 : (!torch.int) -> !torch.list<int>
%result0_1966, %result1_1967, %result2_1968 = torch.aten.native_layer_norm %2697, %2698, %290, %291, %float9.999990e-06_1964 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%2699 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_1969 = torch.constant.int 7
%int1600_1970 = torch.constant.int 1600
%2700 = torch.prim.ListConstruct %int7_1969, %int1600_1970 : (!torch.int, !torch.int) -> !torch.list<int>
%2701 = torch.aten.reshape %result0_1966, %2700 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_1971 = torch.constant.int 0
%int1_1972 = torch.constant.int 1
%2702 = torch.aten.mm %2701, %292 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%2703 = torch.aten.add.Tensor %2702, %293, %int1_1972 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%2704 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_1973 = torch.constant.int 1
%int7_1974 = torch.constant.int 7
%int4800_1975 = torch.constant.int 4800
%2705 = torch.prim.ListConstruct %int1_1973, %int7_1974, %int4800_1975 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2706 = torch.aten.reshape %2703, %2705 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%2707 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%2708 = torch.prim.tolist(%2707) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2_1976 = torch.constant.int 2
%2709 = torch.aten.split_with_sizes %2706, %2708, %int2_1976 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%2710:3 = torch.prim.ListUnpack %2709 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%2711 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_1977 = torch.constant.int 1
%int7_1978 = torch.constant.int 7
%int25_1979 = torch.constant.int 25
%int64_1980 = torch.constant.int 64
%2712 = torch.prim.ListConstruct %int1_1977, %int7_1978, %int25_1979, %int64_1980 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2713 = torch.aten.reshape %2710#0, %2712 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_1981 = torch.constant.int 1
%int2_1982 = torch.constant.int 2
%2714 = torch.aten.transpose.int %2713, %int1_1981, %int2_1982 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%2715 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_1983 = torch.constant.int 1
%int7_1984 = torch.constant.int 7
%int25_1985 = torch.constant.int 25
%int64_1986 = torch.constant.int 64
%2716 = torch.prim.ListConstruct %int1_1983, %int7_1984, %int25_1985, %int64_1986 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2717 = torch.aten.reshape %2710#1, %2716 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_1987 = torch.constant.int 1
%int2_1988 = torch.constant.int 2
%2718 = torch.aten.transpose.int %2717, %int1_1987, %int2_1988 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%2719 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_1989 = torch.constant.int 1
%int7_1990 = torch.constant.int 7
%int25_1991 = torch.constant.int 25
%int64_1992 = torch.constant.int 64
%2720 = torch.prim.ListConstruct %int1_1989, %int7_1990, %int25_1991, %int64_1992 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2721 = torch.aten.reshape %2710#2, %2720 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_1993 = torch.constant.int 1
%int2_1994 = torch.constant.int 2
%2722 = torch.aten.transpose.int %2721, %int1_1993, %int2_1994 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_1995 = torch.constant.int 1
%int2_1996 = torch.constant.int 2
%2723 = torch.aten.transpose.int %2717, %int1_1995, %int2_1996 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_1997 = torch.constant.int 2
%int3_1998 = torch.constant.int 3
%2724 = torch.aten.transpose.int %2723, %int2_1997, %int3_1998 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%2725 = torch.aten.matmul %2714, %2724 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%2726 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%2727 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%2728 = torch.aten.pow.Tensor_Tensor %2726, %2727 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%2729 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_1999 = torch.constant.int 0
%2730 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_2000 = torch.constant.none
%float0.000000e00_2001 = torch.constant.float 0.000000e+00
%2731 = torch.aten.full %2730, %float0.000000e00_2001, %none_2000, %none_2000, %none_2000, %none_2000 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_2002 = torch.constant.int 1
%2732 = torch.aten.add.Tensor %2731, %2728, %int1_2002 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%2733 = torch.aten.div.Tensor %2725, %2732 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%2734 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6_2003 = torch.constant.int 6
%none_2004 = torch.constant.none
%false_2005 = torch.constant.bool false
%2735 = torch.aten.to.dtype %2733, %int6_2003, %false_2005, %false_2005, %none_2004 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%2736 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%2737 = torch.aten.where.self %2734, %2735, %2736 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_2006 = torch.constant.int 3
%none_2007 = torch.constant.none
%2738 = torch.aten.softmax.int %2737, %int3_2006, %none_2007 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_2008 = torch.constant.int 6
%none_2009 = torch.constant.none
%false_2010 = torch.constant.bool false
%2739 = torch.aten.to.dtype %2738, %int6_2008, %false_2010, %false_2010, %none_2009 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%2740 = torch.aten.matmul %2739, %2722 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_2011 = torch.constant.int 1
%int2_2012 = torch.constant.int 2
%2741 = torch.aten.transpose.int %2740, %int1_2011, %int2_2012 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%2742 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2013 = torch.constant.int 1
%int7_2014 = torch.constant.int 7
%int1600_2015 = torch.constant.int 1600
%2743 = torch.prim.ListConstruct %int1_2013, %int7_2014, %int1600_2015 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2744 = torch.aten.reshape %2741, %2743 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%2745 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2016 = torch.constant.int 7
%int1600_2017 = torch.constant.int 1600
%2746 = torch.prim.ListConstruct %int7_2016, %int1600_2017 : (!torch.int, !torch.int) -> !torch.list<int>
%2747 = torch.aten.reshape %2744, %2746 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_2018 = torch.constant.int 0
%int1_2019 = torch.constant.int 1
%2748 = torch.aten.mm %2747, %294 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%2749 = torch.aten.add.Tensor %2748, %295, %int1_2019 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%2750 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2020 = torch.constant.int 1
%int7_2021 = torch.constant.int 7
%int1600_2022 = torch.constant.int 1600
%2751 = torch.prim.ListConstruct %int1_2020, %int7_2021, %int1600_2022 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2752 = torch.aten.reshape %2749, %2751 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_2023 = torch.constant.int 1
%2753 = torch.aten.add.Tensor %2752, %2697, %int1_2023 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_2024 = torch.constant.float 9.9999997473787516E-6
%int1600_2025 = torch.constant.int 1600
%2754 = torch.prim.ListConstruct %int1600_2025 : (!torch.int) -> !torch.list<int>
%result0_2026, %result1_2027, %result2_2028 = torch.aten.native_layer_norm %2753, %2754, %296, %297, %float9.999990e-06_2024 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%2755 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2029 = torch.constant.int 7
%int1600_2030 = torch.constant.int 1600
%2756 = torch.prim.ListConstruct %int7_2029, %int1600_2030 : (!torch.int, !torch.int) -> !torch.list<int>
%2757 = torch.aten.reshape %result0_2026, %2756 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_2031 = torch.constant.int 0
%int1_2032 = torch.constant.int 1
%2758 = torch.aten.mm %2757, %298 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%2759 = torch.aten.add.Tensor %2758, %299, %int1_2032 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%2760 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2033 = torch.constant.int 1
%int7_2034 = torch.constant.int 7
%int6400_2035 = torch.constant.int 6400
%2761 = torch.prim.ListConstruct %int1_2033, %int7_2034, %int6400_2035 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2762 = torch.aten.reshape %2759, %2761 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%2763 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%2764 = torch.aten.mul.Tensor %2762, %2763 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%2765 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%2766 = torch.aten.pow.Tensor_Tensor %2762, %2765 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%2767 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%2768 = torch.aten.mul.Tensor %2766, %2767 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_2036 = torch.constant.int 1
%2769 = torch.aten.add.Tensor %2762, %2768, %int1_2036 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%2770 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%2771 = torch.aten.mul.Tensor %2769, %2770 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%2772 = torch.aten.tanh %2771 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%2773 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_2037 = torch.constant.int 1
%2774 = torch.aten.add.Tensor %2772, %2773, %int1_2037 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%2775 = torch.aten.mul.Tensor %2764, %2774 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%2776 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2038 = torch.constant.int 7
%int6400_2039 = torch.constant.int 6400
%2777 = torch.prim.ListConstruct %int7_2038, %int6400_2039 : (!torch.int, !torch.int) -> !torch.list<int>
%2778 = torch.aten.reshape %2775, %2777 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_2040 = torch.constant.int 0
%int1_2041 = torch.constant.int 1
%2779 = torch.aten.mm %2778, %300 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%2780 = torch.aten.add.Tensor %2779, %301, %int1_2041 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%2781 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2042 = torch.constant.int 1
%int7_2043 = torch.constant.int 7
%int1600_2044 = torch.constant.int 1600
%2782 = torch.prim.ListConstruct %int1_2042, %int7_2043, %int1600_2044 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2783 = torch.aten.reshape %2780, %2782 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_2045 = torch.constant.int 1
%2784 = torch.aten.add.Tensor %2753, %2783, %int1_2045 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_2046 = torch.constant.float 9.9999997473787516E-6
%int1600_2047 = torch.constant.int 1600
%2785 = torch.prim.ListConstruct %int1600_2047 : (!torch.int) -> !torch.list<int>
%result0_2048, %result1_2049, %result2_2050 = torch.aten.native_layer_norm %2784, %2785, %302, %303, %float9.999990e-06_2046 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%2786 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2051 = torch.constant.int 7
%int1600_2052 = torch.constant.int 1600
%2787 = torch.prim.ListConstruct %int7_2051, %int1600_2052 : (!torch.int, !torch.int) -> !torch.list<int>
%2788 = torch.aten.reshape %result0_2048, %2787 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_2053 = torch.constant.int 0
%int1_2054 = torch.constant.int 1
%2789 = torch.aten.mm %2788, %304 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%2790 = torch.aten.add.Tensor %2789, %305, %int1_2054 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%2791 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2055 = torch.constant.int 1
%int7_2056 = torch.constant.int 7
%int4800_2057 = torch.constant.int 4800
%2792 = torch.prim.ListConstruct %int1_2055, %int7_2056, %int4800_2057 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2793 = torch.aten.reshape %2790, %2792 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%2794 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%2795 = torch.prim.tolist(%2794) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2_2058 = torch.constant.int 2
%2796 = torch.aten.split_with_sizes %2793, %2795, %int2_2058 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%2797:3 = torch.prim.ListUnpack %2796 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%2798 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_2059 = torch.constant.int 1
%int7_2060 = torch.constant.int 7
%int25_2061 = torch.constant.int 25
%int64_2062 = torch.constant.int 64
%2799 = torch.prim.ListConstruct %int1_2059, %int7_2060, %int25_2061, %int64_2062 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2800 = torch.aten.reshape %2797#0, %2799 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_2063 = torch.constant.int 1
%int2_2064 = torch.constant.int 2
%2801 = torch.aten.transpose.int %2800, %int1_2063, %int2_2064 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%2802 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_2065 = torch.constant.int 1
%int7_2066 = torch.constant.int 7
%int25_2067 = torch.constant.int 25
%int64_2068 = torch.constant.int 64
%2803 = torch.prim.ListConstruct %int1_2065, %int7_2066, %int25_2067, %int64_2068 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2804 = torch.aten.reshape %2797#1, %2803 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_2069 = torch.constant.int 1
%int2_2070 = torch.constant.int 2
%2805 = torch.aten.transpose.int %2804, %int1_2069, %int2_2070 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%2806 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_2071 = torch.constant.int 1
%int7_2072 = torch.constant.int 7
%int25_2073 = torch.constant.int 25
%int64_2074 = torch.constant.int 64
%2807 = torch.prim.ListConstruct %int1_2071, %int7_2072, %int25_2073, %int64_2074 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2808 = torch.aten.reshape %2797#2, %2807 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_2075 = torch.constant.int 1
%int2_2076 = torch.constant.int 2
%2809 = torch.aten.transpose.int %2808, %int1_2075, %int2_2076 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_2077 = torch.constant.int 1
%int2_2078 = torch.constant.int 2
%2810 = torch.aten.transpose.int %2804, %int1_2077, %int2_2078 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_2079 = torch.constant.int 2
%int3_2080 = torch.constant.int 3
%2811 = torch.aten.transpose.int %2810, %int2_2079, %int3_2080 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%2812 = torch.aten.matmul %2801, %2811 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%2813 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%2814 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%2815 = torch.aten.pow.Tensor_Tensor %2813, %2814 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%2816 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_2081 = torch.constant.int 0
%2817 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_2082 = torch.constant.none
%float0.000000e00_2083 = torch.constant.float 0.000000e+00
%2818 = torch.aten.full %2817, %float0.000000e00_2083, %none_2082, %none_2082, %none_2082, %none_2082 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_2084 = torch.constant.int 1
%2819 = torch.aten.add.Tensor %2818, %2815, %int1_2084 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%2820 = torch.aten.div.Tensor %2812, %2819 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%2821 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6_2085 = torch.constant.int 6
%none_2086 = torch.constant.none
%false_2087 = torch.constant.bool false
%2822 = torch.aten.to.dtype %2820, %int6_2085, %false_2087, %false_2087, %none_2086 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%2823 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%2824 = torch.aten.where.self %2821, %2822, %2823 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_2088 = torch.constant.int 3
%none_2089 = torch.constant.none
%2825 = torch.aten.softmax.int %2824, %int3_2088, %none_2089 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_2090 = torch.constant.int 6
%none_2091 = torch.constant.none
%false_2092 = torch.constant.bool false
%2826 = torch.aten.to.dtype %2825, %int6_2090, %false_2092, %false_2092, %none_2091 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%2827 = torch.aten.matmul %2826, %2809 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_2093 = torch.constant.int 1
%int2_2094 = torch.constant.int 2
%2828 = torch.aten.transpose.int %2827, %int1_2093, %int2_2094 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%2829 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2095 = torch.constant.int 1
%int7_2096 = torch.constant.int 7
%int1600_2097 = torch.constant.int 1600
%2830 = torch.prim.ListConstruct %int1_2095, %int7_2096, %int1600_2097 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2831 = torch.aten.reshape %2828, %2830 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%2832 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2098 = torch.constant.int 7
%int1600_2099 = torch.constant.int 1600
%2833 = torch.prim.ListConstruct %int7_2098, %int1600_2099 : (!torch.int, !torch.int) -> !torch.list<int>
%2834 = torch.aten.reshape %2831, %2833 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_2100 = torch.constant.int 0
%int1_2101 = torch.constant.int 1
%2835 = torch.aten.mm %2834, %306 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%2836 = torch.aten.add.Tensor %2835, %307, %int1_2101 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%2837 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2102 = torch.constant.int 1
%int7_2103 = torch.constant.int 7
%int1600_2104 = torch.constant.int 1600
%2838 = torch.prim.ListConstruct %int1_2102, %int7_2103, %int1600_2104 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2839 = torch.aten.reshape %2836, %2838 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_2105 = torch.constant.int 1
%2840 = torch.aten.add.Tensor %2839, %2784, %int1_2105 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_2106 = torch.constant.float 9.9999997473787516E-6
%int1600_2107 = torch.constant.int 1600
%2841 = torch.prim.ListConstruct %int1600_2107 : (!torch.int) -> !torch.list<int>
%result0_2108, %result1_2109, %result2_2110 = torch.aten.native_layer_norm %2840, %2841, %308, %309, %float9.999990e-06_2106 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%2842 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2111 = torch.constant.int 7
%int1600_2112 = torch.constant.int 1600
%2843 = torch.prim.ListConstruct %int7_2111, %int1600_2112 : (!torch.int, !torch.int) -> !torch.list<int>
%2844 = torch.aten.reshape %result0_2108, %2843 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_2113 = torch.constant.int 0
%int1_2114 = torch.constant.int 1
%2845 = torch.aten.mm %2844, %310 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%2846 = torch.aten.add.Tensor %2845, %311, %int1_2114 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%2847 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2115 = torch.constant.int 1
%int7_2116 = torch.constant.int 7
%int6400_2117 = torch.constant.int 6400
%2848 = torch.prim.ListConstruct %int1_2115, %int7_2116, %int6400_2117 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2849 = torch.aten.reshape %2846, %2848 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%2850 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%2851 = torch.aten.mul.Tensor %2849, %2850 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%2852 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%2853 = torch.aten.pow.Tensor_Tensor %2849, %2852 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%2854 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%2855 = torch.aten.mul.Tensor %2853, %2854 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_2118 = torch.constant.int 1
%2856 = torch.aten.add.Tensor %2849, %2855, %int1_2118 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%2857 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%2858 = torch.aten.mul.Tensor %2856, %2857 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%2859 = torch.aten.tanh %2858 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%2860 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_2119 = torch.constant.int 1
%2861 = torch.aten.add.Tensor %2859, %2860, %int1_2119 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%2862 = torch.aten.mul.Tensor %2851, %2861 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%2863 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2120 = torch.constant.int 7
%int6400_2121 = torch.constant.int 6400
%2864 = torch.prim.ListConstruct %int7_2120, %int6400_2121 : (!torch.int, !torch.int) -> !torch.list<int>
%2865 = torch.aten.reshape %2862, %2864 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_2122 = torch.constant.int 0
%int1_2123 = torch.constant.int 1
%2866 = torch.aten.mm %2865, %312 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%2867 = torch.aten.add.Tensor %2866, %313, %int1_2123 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%2868 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2124 = torch.constant.int 1
%int7_2125 = torch.constant.int 7
%int1600_2126 = torch.constant.int 1600
%2869 = torch.prim.ListConstruct %int1_2124, %int7_2125, %int1600_2126 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2870 = torch.aten.reshape %2867, %2869 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_2127 = torch.constant.int 1
%2871 = torch.aten.add.Tensor %2840, %2870, %int1_2127 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_2128 = torch.constant.float 9.9999997473787516E-6
%int1600_2129 = torch.constant.int 1600
%2872 = torch.prim.ListConstruct %int1600_2129 : (!torch.int) -> !torch.list<int>
%result0_2130, %result1_2131, %result2_2132 = torch.aten.native_layer_norm %2871, %2872, %314, %315, %float9.999990e-06_2128 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%2873 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2133 = torch.constant.int 7
%int1600_2134 = torch.constant.int 1600
%2874 = torch.prim.ListConstruct %int7_2133, %int1600_2134 : (!torch.int, !torch.int) -> !torch.list<int>
%2875 = torch.aten.reshape %result0_2130, %2874 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_2135 = torch.constant.int 0
%int1_2136 = torch.constant.int 1
%2876 = torch.aten.mm %2875, %316 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%2877 = torch.aten.add.Tensor %2876, %317, %int1_2136 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%2878 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2137 = torch.constant.int 1
%int7_2138 = torch.constant.int 7
%int4800_2139 = torch.constant.int 4800
%2879 = torch.prim.ListConstruct %int1_2137, %int7_2138, %int4800_2139 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2880 = torch.aten.reshape %2877, %2879 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%2881 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%2882 = torch.prim.tolist(%2881) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2_2140 = torch.constant.int 2
%2883 = torch.aten.split_with_sizes %2880, %2882, %int2_2140 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%2884:3 = torch.prim.ListUnpack %2883 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%2885 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_2141 = torch.constant.int 1
%int7_2142 = torch.constant.int 7
%int25_2143 = torch.constant.int 25
%int64_2144 = torch.constant.int 64
%2886 = torch.prim.ListConstruct %int1_2141, %int7_2142, %int25_2143, %int64_2144 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2887 = torch.aten.reshape %2884#0, %2886 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_2145 = torch.constant.int 1
%int2_2146 = torch.constant.int 2
%2888 = torch.aten.transpose.int %2887, %int1_2145, %int2_2146 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%2889 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_2147 = torch.constant.int 1
%int7_2148 = torch.constant.int 7
%int25_2149 = torch.constant.int 25
%int64_2150 = torch.constant.int 64
%2890 = torch.prim.ListConstruct %int1_2147, %int7_2148, %int25_2149, %int64_2150 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2891 = torch.aten.reshape %2884#1, %2890 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_2151 = torch.constant.int 1
%int2_2152 = torch.constant.int 2
%2892 = torch.aten.transpose.int %2891, %int1_2151, %int2_2152 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%2893 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_2153 = torch.constant.int 1
%int7_2154 = torch.constant.int 7
%int25_2155 = torch.constant.int 25
%int64_2156 = torch.constant.int 64
%2894 = torch.prim.ListConstruct %int1_2153, %int7_2154, %int25_2155, %int64_2156 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2895 = torch.aten.reshape %2884#2, %2894 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_2157 = torch.constant.int 1
%int2_2158 = torch.constant.int 2
%2896 = torch.aten.transpose.int %2895, %int1_2157, %int2_2158 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_2159 = torch.constant.int 1
%int2_2160 = torch.constant.int 2
%2897 = torch.aten.transpose.int %2891, %int1_2159, %int2_2160 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_2161 = torch.constant.int 2
%int3_2162 = torch.constant.int 3
%2898 = torch.aten.transpose.int %2897, %int2_2161, %int3_2162 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%2899 = torch.aten.matmul %2888, %2898 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%2900 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%2901 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%2902 = torch.aten.pow.Tensor_Tensor %2900, %2901 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%2903 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_2163 = torch.constant.int 0
%2904 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_2164 = torch.constant.none
%float0.000000e00_2165 = torch.constant.float 0.000000e+00
%2905 = torch.aten.full %2904, %float0.000000e00_2165, %none_2164, %none_2164, %none_2164, %none_2164 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_2166 = torch.constant.int 1
%2906 = torch.aten.add.Tensor %2905, %2902, %int1_2166 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%2907 = torch.aten.div.Tensor %2899, %2906 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%2908 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6_2167 = torch.constant.int 6
%none_2168 = torch.constant.none
%false_2169 = torch.constant.bool false
%2909 = torch.aten.to.dtype %2907, %int6_2167, %false_2169, %false_2169, %none_2168 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%2910 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%2911 = torch.aten.where.self %2908, %2909, %2910 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_2170 = torch.constant.int 3
%none_2171 = torch.constant.none
%2912 = torch.aten.softmax.int %2911, %int3_2170, %none_2171 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_2172 = torch.constant.int 6
%none_2173 = torch.constant.none
%false_2174 = torch.constant.bool false
%2913 = torch.aten.to.dtype %2912, %int6_2172, %false_2174, %false_2174, %none_2173 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%2914 = torch.aten.matmul %2913, %2896 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_2175 = torch.constant.int 1
%int2_2176 = torch.constant.int 2
%2915 = torch.aten.transpose.int %2914, %int1_2175, %int2_2176 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%2916 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2177 = torch.constant.int 1
%int7_2178 = torch.constant.int 7
%int1600_2179 = torch.constant.int 1600
%2917 = torch.prim.ListConstruct %int1_2177, %int7_2178, %int1600_2179 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2918 = torch.aten.reshape %2915, %2917 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%2919 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2180 = torch.constant.int 7
%int1600_2181 = torch.constant.int 1600
%2920 = torch.prim.ListConstruct %int7_2180, %int1600_2181 : (!torch.int, !torch.int) -> !torch.list<int>
%2921 = torch.aten.reshape %2918, %2920 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_2182 = torch.constant.int 0
%int1_2183 = torch.constant.int 1
%2922 = torch.aten.mm %2921, %318 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%2923 = torch.aten.add.Tensor %2922, %319, %int1_2183 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%2924 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2184 = torch.constant.int 1
%int7_2185 = torch.constant.int 7
%int1600_2186 = torch.constant.int 1600
%2925 = torch.prim.ListConstruct %int1_2184, %int7_2185, %int1600_2186 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2926 = torch.aten.reshape %2923, %2925 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_2187 = torch.constant.int 1
%2927 = torch.aten.add.Tensor %2926, %2871, %int1_2187 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_2188 = torch.constant.float 9.9999997473787516E-6
%int1600_2189 = torch.constant.int 1600
%2928 = torch.prim.ListConstruct %int1600_2189 : (!torch.int) -> !torch.list<int>
%result0_2190, %result1_2191, %result2_2192 = torch.aten.native_layer_norm %2927, %2928, %320, %321, %float9.999990e-06_2188 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%2929 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2193 = torch.constant.int 7
%int1600_2194 = torch.constant.int 1600
%2930 = torch.prim.ListConstruct %int7_2193, %int1600_2194 : (!torch.int, !torch.int) -> !torch.list<int>
%2931 = torch.aten.reshape %result0_2190, %2930 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_2195 = torch.constant.int 0
%int1_2196 = torch.constant.int 1
%2932 = torch.aten.mm %2931, %322 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%2933 = torch.aten.add.Tensor %2932, %323, %int1_2196 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%2934 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2197 = torch.constant.int 1
%int7_2198 = torch.constant.int 7
%int6400_2199 = torch.constant.int 6400
%2935 = torch.prim.ListConstruct %int1_2197, %int7_2198, %int6400_2199 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2936 = torch.aten.reshape %2933, %2935 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%2937 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%2938 = torch.aten.mul.Tensor %2936, %2937 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%2939 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%2940 = torch.aten.pow.Tensor_Tensor %2936, %2939 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%2941 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%2942 = torch.aten.mul.Tensor %2940, %2941 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_2200 = torch.constant.int 1
%2943 = torch.aten.add.Tensor %2936, %2942, %int1_2200 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%2944 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%2945 = torch.aten.mul.Tensor %2943, %2944 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%2946 = torch.aten.tanh %2945 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%2947 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_2201 = torch.constant.int 1
%2948 = torch.aten.add.Tensor %2946, %2947, %int1_2201 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%2949 = torch.aten.mul.Tensor %2938, %2948 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%2950 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2202 = torch.constant.int 7
%int6400_2203 = torch.constant.int 6400
%2951 = torch.prim.ListConstruct %int7_2202, %int6400_2203 : (!torch.int, !torch.int) -> !torch.list<int>
%2952 = torch.aten.reshape %2949, %2951 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_2204 = torch.constant.int 0
%int1_2205 = torch.constant.int 1
%2953 = torch.aten.mm %2952, %324 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%2954 = torch.aten.add.Tensor %2953, %325, %int1_2205 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%2955 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2206 = torch.constant.int 1
%int7_2207 = torch.constant.int 7
%int1600_2208 = torch.constant.int 1600
%2956 = torch.prim.ListConstruct %int1_2206, %int7_2207, %int1600_2208 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2957 = torch.aten.reshape %2954, %2956 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_2209 = torch.constant.int 1
%2958 = torch.aten.add.Tensor %2927, %2957, %int1_2209 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_2210 = torch.constant.float 9.9999997473787516E-6
%int1600_2211 = torch.constant.int 1600
%2959 = torch.prim.ListConstruct %int1600_2211 : (!torch.int) -> !torch.list<int>
%result0_2212, %result1_2213, %result2_2214 = torch.aten.native_layer_norm %2958, %2959, %326, %327, %float9.999990e-06_2210 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%2960 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2215 = torch.constant.int 7
%int1600_2216 = torch.constant.int 1600
%2961 = torch.prim.ListConstruct %int7_2215, %int1600_2216 : (!torch.int, !torch.int) -> !torch.list<int>
%2962 = torch.aten.reshape %result0_2212, %2961 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_2217 = torch.constant.int 0
%int1_2218 = torch.constant.int 1
%2963 = torch.aten.mm %2962, %328 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%2964 = torch.aten.add.Tensor %2963, %329, %int1_2218 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%2965 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2219 = torch.constant.int 1
%int7_2220 = torch.constant.int 7
%int4800_2221 = torch.constant.int 4800
%2966 = torch.prim.ListConstruct %int1_2219, %int7_2220, %int4800_2221 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2967 = torch.aten.reshape %2964, %2966 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%2968 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%2969 = torch.prim.tolist(%2968) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2_2222 = torch.constant.int 2
%2970 = torch.aten.split_with_sizes %2967, %2969, %int2_2222 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%2971:3 = torch.prim.ListUnpack %2970 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%2972 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_2223 = torch.constant.int 1
%int7_2224 = torch.constant.int 7
%int25_2225 = torch.constant.int 25
%int64_2226 = torch.constant.int 64
%2973 = torch.prim.ListConstruct %int1_2223, %int7_2224, %int25_2225, %int64_2226 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2974 = torch.aten.reshape %2971#0, %2973 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_2227 = torch.constant.int 1
%int2_2228 = torch.constant.int 2
%2975 = torch.aten.transpose.int %2974, %int1_2227, %int2_2228 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%2976 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_2229 = torch.constant.int 1
%int7_2230 = torch.constant.int 7
%int25_2231 = torch.constant.int 25
%int64_2232 = torch.constant.int 64
%2977 = torch.prim.ListConstruct %int1_2229, %int7_2230, %int25_2231, %int64_2232 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2978 = torch.aten.reshape %2971#1, %2977 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_2233 = torch.constant.int 1
%int2_2234 = torch.constant.int 2
%2979 = torch.aten.transpose.int %2978, %int1_2233, %int2_2234 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%2980 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_2235 = torch.constant.int 1
%int7_2236 = torch.constant.int 7
%int25_2237 = torch.constant.int 25
%int64_2238 = torch.constant.int 64
%2981 = torch.prim.ListConstruct %int1_2235, %int7_2236, %int25_2237, %int64_2238 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%2982 = torch.aten.reshape %2971#2, %2981 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_2239 = torch.constant.int 1
%int2_2240 = torch.constant.int 2
%2983 = torch.aten.transpose.int %2982, %int1_2239, %int2_2240 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_2241 = torch.constant.int 1
%int2_2242 = torch.constant.int 2
%2984 = torch.aten.transpose.int %2978, %int1_2241, %int2_2242 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_2243 = torch.constant.int 2
%int3_2244 = torch.constant.int 3
%2985 = torch.aten.transpose.int %2984, %int2_2243, %int3_2244 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%2986 = torch.aten.matmul %2975, %2985 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%2987 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%2988 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%2989 = torch.aten.pow.Tensor_Tensor %2987, %2988 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%2990 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_2245 = torch.constant.int 0
%2991 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_2246 = torch.constant.none
%float0.000000e00_2247 = torch.constant.float 0.000000e+00
%2992 = torch.aten.full %2991, %float0.000000e00_2247, %none_2246, %none_2246, %none_2246, %none_2246 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_2248 = torch.constant.int 1
%2993 = torch.aten.add.Tensor %2992, %2989, %int1_2248 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%2994 = torch.aten.div.Tensor %2986, %2993 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%2995 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6_2249 = torch.constant.int 6
%none_2250 = torch.constant.none
%false_2251 = torch.constant.bool false
%2996 = torch.aten.to.dtype %2994, %int6_2249, %false_2251, %false_2251, %none_2250 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%2997 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%2998 = torch.aten.where.self %2995, %2996, %2997 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_2252 = torch.constant.int 3
%none_2253 = torch.constant.none
%2999 = torch.aten.softmax.int %2998, %int3_2252, %none_2253 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_2254 = torch.constant.int 6
%none_2255 = torch.constant.none
%false_2256 = torch.constant.bool false
%3000 = torch.aten.to.dtype %2999, %int6_2254, %false_2256, %false_2256, %none_2255 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%3001 = torch.aten.matmul %3000, %2983 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_2257 = torch.constant.int 1
%int2_2258 = torch.constant.int 2
%3002 = torch.aten.transpose.int %3001, %int1_2257, %int2_2258 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%3003 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2259 = torch.constant.int 1
%int7_2260 = torch.constant.int 7
%int1600_2261 = torch.constant.int 1600
%3004 = torch.prim.ListConstruct %int1_2259, %int7_2260, %int1600_2261 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3005 = torch.aten.reshape %3002, %3004 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%3006 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2262 = torch.constant.int 7
%int1600_2263 = torch.constant.int 1600
%3007 = torch.prim.ListConstruct %int7_2262, %int1600_2263 : (!torch.int, !torch.int) -> !torch.list<int>
%3008 = torch.aten.reshape %3005, %3007 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_2264 = torch.constant.int 0
%int1_2265 = torch.constant.int 1
%3009 = torch.aten.mm %3008, %330 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%3010 = torch.aten.add.Tensor %3009, %331, %int1_2265 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%3011 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2266 = torch.constant.int 1
%int7_2267 = torch.constant.int 7
%int1600_2268 = torch.constant.int 1600
%3012 = torch.prim.ListConstruct %int1_2266, %int7_2267, %int1600_2268 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3013 = torch.aten.reshape %3010, %3012 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_2269 = torch.constant.int 1
%3014 = torch.aten.add.Tensor %3013, %2958, %int1_2269 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_2270 = torch.constant.float 9.9999997473787516E-6
%int1600_2271 = torch.constant.int 1600
%3015 = torch.prim.ListConstruct %int1600_2271 : (!torch.int) -> !torch.list<int>
%result0_2272, %result1_2273, %result2_2274 = torch.aten.native_layer_norm %3014, %3015, %332, %333, %float9.999990e-06_2270 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%3016 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2275 = torch.constant.int 7
%int1600_2276 = torch.constant.int 1600
%3017 = torch.prim.ListConstruct %int7_2275, %int1600_2276 : (!torch.int, !torch.int) -> !torch.list<int>
%3018 = torch.aten.reshape %result0_2272, %3017 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_2277 = torch.constant.int 0
%int1_2278 = torch.constant.int 1
%3019 = torch.aten.mm %3018, %334 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%3020 = torch.aten.add.Tensor %3019, %335, %int1_2278 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%3021 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2279 = torch.constant.int 1
%int7_2280 = torch.constant.int 7
%int6400_2281 = torch.constant.int 6400
%3022 = torch.prim.ListConstruct %int1_2279, %int7_2280, %int6400_2281 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3023 = torch.aten.reshape %3020, %3022 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%3024 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%3025 = torch.aten.mul.Tensor %3023, %3024 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%3026 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%3027 = torch.aten.pow.Tensor_Tensor %3023, %3026 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%3028 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%3029 = torch.aten.mul.Tensor %3027, %3028 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_2282 = torch.constant.int 1
%3030 = torch.aten.add.Tensor %3023, %3029, %int1_2282 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%3031 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%3032 = torch.aten.mul.Tensor %3030, %3031 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%3033 = torch.aten.tanh %3032 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%3034 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_2283 = torch.constant.int 1
%3035 = torch.aten.add.Tensor %3033, %3034, %int1_2283 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%3036 = torch.aten.mul.Tensor %3025, %3035 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%3037 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2284 = torch.constant.int 7
%int6400_2285 = torch.constant.int 6400
%3038 = torch.prim.ListConstruct %int7_2284, %int6400_2285 : (!torch.int, !torch.int) -> !torch.list<int>
%3039 = torch.aten.reshape %3036, %3038 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_2286 = torch.constant.int 0
%int1_2287 = torch.constant.int 1
%3040 = torch.aten.mm %3039, %336 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%3041 = torch.aten.add.Tensor %3040, %337, %int1_2287 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%3042 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2288 = torch.constant.int 1
%int7_2289 = torch.constant.int 7
%int1600_2290 = torch.constant.int 1600
%3043 = torch.prim.ListConstruct %int1_2288, %int7_2289, %int1600_2290 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3044 = torch.aten.reshape %3041, %3043 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_2291 = torch.constant.int 1
%3045 = torch.aten.add.Tensor %3014, %3044, %int1_2291 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_2292 = torch.constant.float 9.9999997473787516E-6
%int1600_2293 = torch.constant.int 1600
%3046 = torch.prim.ListConstruct %int1600_2293 : (!torch.int) -> !torch.list<int>
%result0_2294, %result1_2295, %result2_2296 = torch.aten.native_layer_norm %3045, %3046, %338, %339, %float9.999990e-06_2292 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%3047 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2297 = torch.constant.int 7
%int1600_2298 = torch.constant.int 1600
%3048 = torch.prim.ListConstruct %int7_2297, %int1600_2298 : (!torch.int, !torch.int) -> !torch.list<int>
%3049 = torch.aten.reshape %result0_2294, %3048 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_2299 = torch.constant.int 0
%int1_2300 = torch.constant.int 1
%3050 = torch.aten.mm %3049, %340 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%3051 = torch.aten.add.Tensor %3050, %341, %int1_2300 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%3052 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2301 = torch.constant.int 1
%int7_2302 = torch.constant.int 7
%int4800_2303 = torch.constant.int 4800
%3053 = torch.prim.ListConstruct %int1_2301, %int7_2302, %int4800_2303 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3054 = torch.aten.reshape %3051, %3053 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%3055 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%3056 = torch.prim.tolist(%3055) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2_2304 = torch.constant.int 2
%3057 = torch.aten.split_with_sizes %3054, %3056, %int2_2304 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%3058:3 = torch.prim.ListUnpack %3057 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%3059 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_2305 = torch.constant.int 1
%int7_2306 = torch.constant.int 7
%int25_2307 = torch.constant.int 25
%int64_2308 = torch.constant.int 64
%3060 = torch.prim.ListConstruct %int1_2305, %int7_2306, %int25_2307, %int64_2308 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3061 = torch.aten.reshape %3058#0, %3060 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_2309 = torch.constant.int 1
%int2_2310 = torch.constant.int 2
%3062 = torch.aten.transpose.int %3061, %int1_2309, %int2_2310 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%3063 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_2311 = torch.constant.int 1
%int7_2312 = torch.constant.int 7
%int25_2313 = torch.constant.int 25
%int64_2314 = torch.constant.int 64
%3064 = torch.prim.ListConstruct %int1_2311, %int7_2312, %int25_2313, %int64_2314 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3065 = torch.aten.reshape %3058#1, %3064 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_2315 = torch.constant.int 1
%int2_2316 = torch.constant.int 2
%3066 = torch.aten.transpose.int %3065, %int1_2315, %int2_2316 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%3067 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_2317 = torch.constant.int 1
%int7_2318 = torch.constant.int 7
%int25_2319 = torch.constant.int 25
%int64_2320 = torch.constant.int 64
%3068 = torch.prim.ListConstruct %int1_2317, %int7_2318, %int25_2319, %int64_2320 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3069 = torch.aten.reshape %3058#2, %3068 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_2321 = torch.constant.int 1
%int2_2322 = torch.constant.int 2
%3070 = torch.aten.transpose.int %3069, %int1_2321, %int2_2322 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_2323 = torch.constant.int 1
%int2_2324 = torch.constant.int 2
%3071 = torch.aten.transpose.int %3065, %int1_2323, %int2_2324 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_2325 = torch.constant.int 2
%int3_2326 = torch.constant.int 3
%3072 = torch.aten.transpose.int %3071, %int2_2325, %int3_2326 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%3073 = torch.aten.matmul %3062, %3072 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%3074 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%3075 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%3076 = torch.aten.pow.Tensor_Tensor %3074, %3075 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%3077 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_2327 = torch.constant.int 0
%3078 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_2328 = torch.constant.none
%float0.000000e00_2329 = torch.constant.float 0.000000e+00
%3079 = torch.aten.full %3078, %float0.000000e00_2329, %none_2328, %none_2328, %none_2328, %none_2328 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_2330 = torch.constant.int 1
%3080 = torch.aten.add.Tensor %3079, %3076, %int1_2330 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%3081 = torch.aten.div.Tensor %3073, %3080 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%3082 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6_2331 = torch.constant.int 6
%none_2332 = torch.constant.none
%false_2333 = torch.constant.bool false
%3083 = torch.aten.to.dtype %3081, %int6_2331, %false_2333, %false_2333, %none_2332 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%3084 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%3085 = torch.aten.where.self %3082, %3083, %3084 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_2334 = torch.constant.int 3
%none_2335 = torch.constant.none
%3086 = torch.aten.softmax.int %3085, %int3_2334, %none_2335 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_2336 = torch.constant.int 6
%none_2337 = torch.constant.none
%false_2338 = torch.constant.bool false
%3087 = torch.aten.to.dtype %3086, %int6_2336, %false_2338, %false_2338, %none_2337 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%3088 = torch.aten.matmul %3087, %3070 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_2339 = torch.constant.int 1
%int2_2340 = torch.constant.int 2
%3089 = torch.aten.transpose.int %3088, %int1_2339, %int2_2340 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%3090 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2341 = torch.constant.int 1
%int7_2342 = torch.constant.int 7
%int1600_2343 = torch.constant.int 1600
%3091 = torch.prim.ListConstruct %int1_2341, %int7_2342, %int1600_2343 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3092 = torch.aten.reshape %3089, %3091 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%3093 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2344 = torch.constant.int 7
%int1600_2345 = torch.constant.int 1600
%3094 = torch.prim.ListConstruct %int7_2344, %int1600_2345 : (!torch.int, !torch.int) -> !torch.list<int>
%3095 = torch.aten.reshape %3092, %3094 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_2346 = torch.constant.int 0
%int1_2347 = torch.constant.int 1
%3096 = torch.aten.mm %3095, %342 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%3097 = torch.aten.add.Tensor %3096, %343, %int1_2347 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%3098 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2348 = torch.constant.int 1
%int7_2349 = torch.constant.int 7
%int1600_2350 = torch.constant.int 1600
%3099 = torch.prim.ListConstruct %int1_2348, %int7_2349, %int1600_2350 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3100 = torch.aten.reshape %3097, %3099 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_2351 = torch.constant.int 1
%3101 = torch.aten.add.Tensor %3100, %3045, %int1_2351 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_2352 = torch.constant.float 9.9999997473787516E-6
%int1600_2353 = torch.constant.int 1600
%3102 = torch.prim.ListConstruct %int1600_2353 : (!torch.int) -> !torch.list<int>
%result0_2354, %result1_2355, %result2_2356 = torch.aten.native_layer_norm %3101, %3102, %344, %345, %float9.999990e-06_2352 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%3103 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2357 = torch.constant.int 7
%int1600_2358 = torch.constant.int 1600
%3104 = torch.prim.ListConstruct %int7_2357, %int1600_2358 : (!torch.int, !torch.int) -> !torch.list<int>
%3105 = torch.aten.reshape %result0_2354, %3104 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_2359 = torch.constant.int 0
%int1_2360 = torch.constant.int 1
%3106 = torch.aten.mm %3105, %346 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%3107 = torch.aten.add.Tensor %3106, %347, %int1_2360 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%3108 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2361 = torch.constant.int 1
%int7_2362 = torch.constant.int 7
%int6400_2363 = torch.constant.int 6400
%3109 = torch.prim.ListConstruct %int1_2361, %int7_2362, %int6400_2363 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3110 = torch.aten.reshape %3107, %3109 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%3111 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%3112 = torch.aten.mul.Tensor %3110, %3111 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%3113 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%3114 = torch.aten.pow.Tensor_Tensor %3110, %3113 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%3115 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%3116 = torch.aten.mul.Tensor %3114, %3115 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_2364 = torch.constant.int 1
%3117 = torch.aten.add.Tensor %3110, %3116, %int1_2364 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%3118 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%3119 = torch.aten.mul.Tensor %3117, %3118 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%3120 = torch.aten.tanh %3119 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%3121 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_2365 = torch.constant.int 1
%3122 = torch.aten.add.Tensor %3120, %3121, %int1_2365 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%3123 = torch.aten.mul.Tensor %3112, %3122 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%3124 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2366 = torch.constant.int 7
%int6400_2367 = torch.constant.int 6400
%3125 = torch.prim.ListConstruct %int7_2366, %int6400_2367 : (!torch.int, !torch.int) -> !torch.list<int>
%3126 = torch.aten.reshape %3123, %3125 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_2368 = torch.constant.int 0
%int1_2369 = torch.constant.int 1
%3127 = torch.aten.mm %3126, %348 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%3128 = torch.aten.add.Tensor %3127, %349, %int1_2369 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%3129 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2370 = torch.constant.int 1
%int7_2371 = torch.constant.int 7
%int1600_2372 = torch.constant.int 1600
%3130 = torch.prim.ListConstruct %int1_2370, %int7_2371, %int1600_2372 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3131 = torch.aten.reshape %3128, %3130 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_2373 = torch.constant.int 1
%3132 = torch.aten.add.Tensor %3101, %3131, %int1_2373 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_2374 = torch.constant.float 9.9999997473787516E-6
%int1600_2375 = torch.constant.int 1600
%3133 = torch.prim.ListConstruct %int1600_2375 : (!torch.int) -> !torch.list<int>
%result0_2376, %result1_2377, %result2_2378 = torch.aten.native_layer_norm %3132, %3133, %350, %351, %float9.999990e-06_2374 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%3134 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2379 = torch.constant.int 7
%int1600_2380 = torch.constant.int 1600
%3135 = torch.prim.ListConstruct %int7_2379, %int1600_2380 : (!torch.int, !torch.int) -> !torch.list<int>
%3136 = torch.aten.reshape %result0_2376, %3135 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_2381 = torch.constant.int 0
%int1_2382 = torch.constant.int 1
%3137 = torch.aten.mm %3136, %352 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%3138 = torch.aten.add.Tensor %3137, %353, %int1_2382 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%3139 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2383 = torch.constant.int 1
%int7_2384 = torch.constant.int 7
%int4800_2385 = torch.constant.int 4800
%3140 = torch.prim.ListConstruct %int1_2383, %int7_2384, %int4800_2385 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3141 = torch.aten.reshape %3138, %3140 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%3142 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%3143 = torch.prim.tolist(%3142) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2_2386 = torch.constant.int 2
%3144 = torch.aten.split_with_sizes %3141, %3143, %int2_2386 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%3145:3 = torch.prim.ListUnpack %3144 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%3146 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_2387 = torch.constant.int 1
%int7_2388 = torch.constant.int 7
%int25_2389 = torch.constant.int 25
%int64_2390 = torch.constant.int 64
%3147 = torch.prim.ListConstruct %int1_2387, %int7_2388, %int25_2389, %int64_2390 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3148 = torch.aten.reshape %3145#0, %3147 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_2391 = torch.constant.int 1
%int2_2392 = torch.constant.int 2
%3149 = torch.aten.transpose.int %3148, %int1_2391, %int2_2392 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%3150 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_2393 = torch.constant.int 1
%int7_2394 = torch.constant.int 7
%int25_2395 = torch.constant.int 25
%int64_2396 = torch.constant.int 64
%3151 = torch.prim.ListConstruct %int1_2393, %int7_2394, %int25_2395, %int64_2396 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3152 = torch.aten.reshape %3145#1, %3151 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_2397 = torch.constant.int 1
%int2_2398 = torch.constant.int 2
%3153 = torch.aten.transpose.int %3152, %int1_2397, %int2_2398 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%3154 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_2399 = torch.constant.int 1
%int7_2400 = torch.constant.int 7
%int25_2401 = torch.constant.int 25
%int64_2402 = torch.constant.int 64
%3155 = torch.prim.ListConstruct %int1_2399, %int7_2400, %int25_2401, %int64_2402 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3156 = torch.aten.reshape %3145#2, %3155 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_2403 = torch.constant.int 1
%int2_2404 = torch.constant.int 2
%3157 = torch.aten.transpose.int %3156, %int1_2403, %int2_2404 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_2405 = torch.constant.int 1
%int2_2406 = torch.constant.int 2
%3158 = torch.aten.transpose.int %3152, %int1_2405, %int2_2406 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_2407 = torch.constant.int 2
%int3_2408 = torch.constant.int 3
%3159 = torch.aten.transpose.int %3158, %int2_2407, %int3_2408 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%3160 = torch.aten.matmul %3149, %3159 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%3161 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%3162 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%3163 = torch.aten.pow.Tensor_Tensor %3161, %3162 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%3164 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_2409 = torch.constant.int 0
%3165 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_2410 = torch.constant.none
%float0.000000e00_2411 = torch.constant.float 0.000000e+00
%3166 = torch.aten.full %3165, %float0.000000e00_2411, %none_2410, %none_2410, %none_2410, %none_2410 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_2412 = torch.constant.int 1
%3167 = torch.aten.add.Tensor %3166, %3163, %int1_2412 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%3168 = torch.aten.div.Tensor %3160, %3167 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%3169 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6_2413 = torch.constant.int 6
%none_2414 = torch.constant.none
%false_2415 = torch.constant.bool false
%3170 = torch.aten.to.dtype %3168, %int6_2413, %false_2415, %false_2415, %none_2414 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%3171 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%3172 = torch.aten.where.self %3169, %3170, %3171 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_2416 = torch.constant.int 3
%none_2417 = torch.constant.none
%3173 = torch.aten.softmax.int %3172, %int3_2416, %none_2417 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_2418 = torch.constant.int 6
%none_2419 = torch.constant.none
%false_2420 = torch.constant.bool false
%3174 = torch.aten.to.dtype %3173, %int6_2418, %false_2420, %false_2420, %none_2419 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%3175 = torch.aten.matmul %3174, %3157 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_2421 = torch.constant.int 1
%int2_2422 = torch.constant.int 2
%3176 = torch.aten.transpose.int %3175, %int1_2421, %int2_2422 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%3177 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2423 = torch.constant.int 1
%int7_2424 = torch.constant.int 7
%int1600_2425 = torch.constant.int 1600
%3178 = torch.prim.ListConstruct %int1_2423, %int7_2424, %int1600_2425 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3179 = torch.aten.reshape %3176, %3178 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%3180 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2426 = torch.constant.int 7
%int1600_2427 = torch.constant.int 1600
%3181 = torch.prim.ListConstruct %int7_2426, %int1600_2427 : (!torch.int, !torch.int) -> !torch.list<int>
%3182 = torch.aten.reshape %3179, %3181 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_2428 = torch.constant.int 0
%int1_2429 = torch.constant.int 1
%3183 = torch.aten.mm %3182, %354 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%3184 = torch.aten.add.Tensor %3183, %355, %int1_2429 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%3185 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2430 = torch.constant.int 1
%int7_2431 = torch.constant.int 7
%int1600_2432 = torch.constant.int 1600
%3186 = torch.prim.ListConstruct %int1_2430, %int7_2431, %int1600_2432 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3187 = torch.aten.reshape %3184, %3186 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_2433 = torch.constant.int 1
%3188 = torch.aten.add.Tensor %3187, %3132, %int1_2433 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_2434 = torch.constant.float 9.9999997473787516E-6
%int1600_2435 = torch.constant.int 1600
%3189 = torch.prim.ListConstruct %int1600_2435 : (!torch.int) -> !torch.list<int>
%result0_2436, %result1_2437, %result2_2438 = torch.aten.native_layer_norm %3188, %3189, %356, %357, %float9.999990e-06_2434 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%3190 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2439 = torch.constant.int 7
%int1600_2440 = torch.constant.int 1600
%3191 = torch.prim.ListConstruct %int7_2439, %int1600_2440 : (!torch.int, !torch.int) -> !torch.list<int>
%3192 = torch.aten.reshape %result0_2436, %3191 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_2441 = torch.constant.int 0
%int1_2442 = torch.constant.int 1
%3193 = torch.aten.mm %3192, %358 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%3194 = torch.aten.add.Tensor %3193, %359, %int1_2442 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%3195 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2443 = torch.constant.int 1
%int7_2444 = torch.constant.int 7
%int6400_2445 = torch.constant.int 6400
%3196 = torch.prim.ListConstruct %int1_2443, %int7_2444, %int6400_2445 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3197 = torch.aten.reshape %3194, %3196 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%3198 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%3199 = torch.aten.mul.Tensor %3197, %3198 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%3200 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%3201 = torch.aten.pow.Tensor_Tensor %3197, %3200 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%3202 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%3203 = torch.aten.mul.Tensor %3201, %3202 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_2446 = torch.constant.int 1
%3204 = torch.aten.add.Tensor %3197, %3203, %int1_2446 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%3205 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%3206 = torch.aten.mul.Tensor %3204, %3205 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%3207 = torch.aten.tanh %3206 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%3208 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_2447 = torch.constant.int 1
%3209 = torch.aten.add.Tensor %3207, %3208, %int1_2447 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%3210 = torch.aten.mul.Tensor %3199, %3209 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%3211 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2448 = torch.constant.int 7
%int6400_2449 = torch.constant.int 6400
%3212 = torch.prim.ListConstruct %int7_2448, %int6400_2449 : (!torch.int, !torch.int) -> !torch.list<int>
%3213 = torch.aten.reshape %3210, %3212 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_2450 = torch.constant.int 0
%int1_2451 = torch.constant.int 1
%3214 = torch.aten.mm %3213, %360 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%3215 = torch.aten.add.Tensor %3214, %361, %int1_2451 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%3216 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2452 = torch.constant.int 1
%int7_2453 = torch.constant.int 7
%int1600_2454 = torch.constant.int 1600
%3217 = torch.prim.ListConstruct %int1_2452, %int7_2453, %int1600_2454 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3218 = torch.aten.reshape %3215, %3217 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_2455 = torch.constant.int 1
%3219 = torch.aten.add.Tensor %3188, %3218, %int1_2455 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_2456 = torch.constant.float 9.9999997473787516E-6
%int1600_2457 = torch.constant.int 1600
%3220 = torch.prim.ListConstruct %int1600_2457 : (!torch.int) -> !torch.list<int>
%result0_2458, %result1_2459, %result2_2460 = torch.aten.native_layer_norm %3219, %3220, %362, %363, %float9.999990e-06_2456 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%3221 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2461 = torch.constant.int 7
%int1600_2462 = torch.constant.int 1600
%3222 = torch.prim.ListConstruct %int7_2461, %int1600_2462 : (!torch.int, !torch.int) -> !torch.list<int>
%3223 = torch.aten.reshape %result0_2458, %3222 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_2463 = torch.constant.int 0
%int1_2464 = torch.constant.int 1
%3224 = torch.aten.mm %3223, %364 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%3225 = torch.aten.add.Tensor %3224, %365, %int1_2464 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%3226 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2465 = torch.constant.int 1
%int7_2466 = torch.constant.int 7
%int4800_2467 = torch.constant.int 4800
%3227 = torch.prim.ListConstruct %int1_2465, %int7_2466, %int4800_2467 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3228 = torch.aten.reshape %3225, %3227 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%3229 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%3230 = torch.prim.tolist(%3229) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2_2468 = torch.constant.int 2
%3231 = torch.aten.split_with_sizes %3228, %3230, %int2_2468 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%3232:3 = torch.prim.ListUnpack %3231 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%3233 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_2469 = torch.constant.int 1
%int7_2470 = torch.constant.int 7
%int25_2471 = torch.constant.int 25
%int64_2472 = torch.constant.int 64
%3234 = torch.prim.ListConstruct %int1_2469, %int7_2470, %int25_2471, %int64_2472 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3235 = torch.aten.reshape %3232#0, %3234 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_2473 = torch.constant.int 1
%int2_2474 = torch.constant.int 2
%3236 = torch.aten.transpose.int %3235, %int1_2473, %int2_2474 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%3237 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_2475 = torch.constant.int 1
%int7_2476 = torch.constant.int 7
%int25_2477 = torch.constant.int 25
%int64_2478 = torch.constant.int 64
%3238 = torch.prim.ListConstruct %int1_2475, %int7_2476, %int25_2477, %int64_2478 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3239 = torch.aten.reshape %3232#1, %3238 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_2479 = torch.constant.int 1
%int2_2480 = torch.constant.int 2
%3240 = torch.aten.transpose.int %3239, %int1_2479, %int2_2480 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%3241 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_2481 = torch.constant.int 1
%int7_2482 = torch.constant.int 7
%int25_2483 = torch.constant.int 25
%int64_2484 = torch.constant.int 64
%3242 = torch.prim.ListConstruct %int1_2481, %int7_2482, %int25_2483, %int64_2484 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3243 = torch.aten.reshape %3232#2, %3242 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_2485 = torch.constant.int 1
%int2_2486 = torch.constant.int 2
%3244 = torch.aten.transpose.int %3243, %int1_2485, %int2_2486 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_2487 = torch.constant.int 1
%int2_2488 = torch.constant.int 2
%3245 = torch.aten.transpose.int %3239, %int1_2487, %int2_2488 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_2489 = torch.constant.int 2
%int3_2490 = torch.constant.int 3
%3246 = torch.aten.transpose.int %3245, %int2_2489, %int3_2490 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%3247 = torch.aten.matmul %3236, %3246 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%3248 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%3249 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%3250 = torch.aten.pow.Tensor_Tensor %3248, %3249 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%3251 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_2491 = torch.constant.int 0
%3252 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_2492 = torch.constant.none
%float0.000000e00_2493 = torch.constant.float 0.000000e+00
%3253 = torch.aten.full %3252, %float0.000000e00_2493, %none_2492, %none_2492, %none_2492, %none_2492 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_2494 = torch.constant.int 1
%3254 = torch.aten.add.Tensor %3253, %3250, %int1_2494 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%3255 = torch.aten.div.Tensor %3247, %3254 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%3256 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6_2495 = torch.constant.int 6
%none_2496 = torch.constant.none
%false_2497 = torch.constant.bool false
%3257 = torch.aten.to.dtype %3255, %int6_2495, %false_2497, %false_2497, %none_2496 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%3258 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%3259 = torch.aten.where.self %3256, %3257, %3258 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_2498 = torch.constant.int 3
%none_2499 = torch.constant.none
%3260 = torch.aten.softmax.int %3259, %int3_2498, %none_2499 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_2500 = torch.constant.int 6
%none_2501 = torch.constant.none
%false_2502 = torch.constant.bool false
%3261 = torch.aten.to.dtype %3260, %int6_2500, %false_2502, %false_2502, %none_2501 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%3262 = torch.aten.matmul %3261, %3244 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_2503 = torch.constant.int 1
%int2_2504 = torch.constant.int 2
%3263 = torch.aten.transpose.int %3262, %int1_2503, %int2_2504 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%3264 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2505 = torch.constant.int 1
%int7_2506 = torch.constant.int 7
%int1600_2507 = torch.constant.int 1600
%3265 = torch.prim.ListConstruct %int1_2505, %int7_2506, %int1600_2507 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3266 = torch.aten.reshape %3263, %3265 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%3267 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2508 = torch.constant.int 7
%int1600_2509 = torch.constant.int 1600
%3268 = torch.prim.ListConstruct %int7_2508, %int1600_2509 : (!torch.int, !torch.int) -> !torch.list<int>
%3269 = torch.aten.reshape %3266, %3268 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_2510 = torch.constant.int 0
%int1_2511 = torch.constant.int 1
%3270 = torch.aten.mm %3269, %366 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%3271 = torch.aten.add.Tensor %3270, %367, %int1_2511 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%3272 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2512 = torch.constant.int 1
%int7_2513 = torch.constant.int 7
%int1600_2514 = torch.constant.int 1600
%3273 = torch.prim.ListConstruct %int1_2512, %int7_2513, %int1600_2514 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3274 = torch.aten.reshape %3271, %3273 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_2515 = torch.constant.int 1
%3275 = torch.aten.add.Tensor %3274, %3219, %int1_2515 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_2516 = torch.constant.float 9.9999997473787516E-6
%int1600_2517 = torch.constant.int 1600
%3276 = torch.prim.ListConstruct %int1600_2517 : (!torch.int) -> !torch.list<int>
%result0_2518, %result1_2519, %result2_2520 = torch.aten.native_layer_norm %3275, %3276, %368, %369, %float9.999990e-06_2516 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%3277 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2521 = torch.constant.int 7
%int1600_2522 = torch.constant.int 1600
%3278 = torch.prim.ListConstruct %int7_2521, %int1600_2522 : (!torch.int, !torch.int) -> !torch.list<int>
%3279 = torch.aten.reshape %result0_2518, %3278 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_2523 = torch.constant.int 0
%int1_2524 = torch.constant.int 1
%3280 = torch.aten.mm %3279, %370 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%3281 = torch.aten.add.Tensor %3280, %371, %int1_2524 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%3282 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2525 = torch.constant.int 1
%int7_2526 = torch.constant.int 7
%int6400_2527 = torch.constant.int 6400
%3283 = torch.prim.ListConstruct %int1_2525, %int7_2526, %int6400_2527 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3284 = torch.aten.reshape %3281, %3283 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%3285 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%3286 = torch.aten.mul.Tensor %3284, %3285 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%3287 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%3288 = torch.aten.pow.Tensor_Tensor %3284, %3287 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%3289 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%3290 = torch.aten.mul.Tensor %3288, %3289 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_2528 = torch.constant.int 1
%3291 = torch.aten.add.Tensor %3284, %3290, %int1_2528 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%3292 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%3293 = torch.aten.mul.Tensor %3291, %3292 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%3294 = torch.aten.tanh %3293 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%3295 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_2529 = torch.constant.int 1
%3296 = torch.aten.add.Tensor %3294, %3295, %int1_2529 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%3297 = torch.aten.mul.Tensor %3286, %3296 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%3298 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2530 = torch.constant.int 7
%int6400_2531 = torch.constant.int 6400
%3299 = torch.prim.ListConstruct %int7_2530, %int6400_2531 : (!torch.int, !torch.int) -> !torch.list<int>
%3300 = torch.aten.reshape %3297, %3299 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_2532 = torch.constant.int 0
%int1_2533 = torch.constant.int 1
%3301 = torch.aten.mm %3300, %372 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%3302 = torch.aten.add.Tensor %3301, %373, %int1_2533 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%3303 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2534 = torch.constant.int 1
%int7_2535 = torch.constant.int 7
%int1600_2536 = torch.constant.int 1600
%3304 = torch.prim.ListConstruct %int1_2534, %int7_2535, %int1600_2536 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3305 = torch.aten.reshape %3302, %3304 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_2537 = torch.constant.int 1
%3306 = torch.aten.add.Tensor %3275, %3305, %int1_2537 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_2538 = torch.constant.float 9.9999997473787516E-6
%int1600_2539 = torch.constant.int 1600
%3307 = torch.prim.ListConstruct %int1600_2539 : (!torch.int) -> !torch.list<int>
%result0_2540, %result1_2541, %result2_2542 = torch.aten.native_layer_norm %3306, %3307, %374, %375, %float9.999990e-06_2538 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%3308 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2543 = torch.constant.int 7
%int1600_2544 = torch.constant.int 1600
%3309 = torch.prim.ListConstruct %int7_2543, %int1600_2544 : (!torch.int, !torch.int) -> !torch.list<int>
%3310 = torch.aten.reshape %result0_2540, %3309 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_2545 = torch.constant.int 0
%int1_2546 = torch.constant.int 1
%3311 = torch.aten.mm %3310, %376 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%3312 = torch.aten.add.Tensor %3311, %377, %int1_2546 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%3313 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2547 = torch.constant.int 1
%int7_2548 = torch.constant.int 7
%int4800_2549 = torch.constant.int 4800
%3314 = torch.prim.ListConstruct %int1_2547, %int7_2548, %int4800_2549 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3315 = torch.aten.reshape %3312, %3314 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%3316 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%3317 = torch.prim.tolist(%3316) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2_2550 = torch.constant.int 2
%3318 = torch.aten.split_with_sizes %3315, %3317, %int2_2550 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%3319:3 = torch.prim.ListUnpack %3318 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%3320 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_2551 = torch.constant.int 1
%int7_2552 = torch.constant.int 7
%int25_2553 = torch.constant.int 25
%int64_2554 = torch.constant.int 64
%3321 = torch.prim.ListConstruct %int1_2551, %int7_2552, %int25_2553, %int64_2554 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3322 = torch.aten.reshape %3319#0, %3321 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_2555 = torch.constant.int 1
%int2_2556 = torch.constant.int 2
%3323 = torch.aten.transpose.int %3322, %int1_2555, %int2_2556 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%3324 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_2557 = torch.constant.int 1
%int7_2558 = torch.constant.int 7
%int25_2559 = torch.constant.int 25
%int64_2560 = torch.constant.int 64
%3325 = torch.prim.ListConstruct %int1_2557, %int7_2558, %int25_2559, %int64_2560 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3326 = torch.aten.reshape %3319#1, %3325 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_2561 = torch.constant.int 1
%int2_2562 = torch.constant.int 2
%3327 = torch.aten.transpose.int %3326, %int1_2561, %int2_2562 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%3328 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_2563 = torch.constant.int 1
%int7_2564 = torch.constant.int 7
%int25_2565 = torch.constant.int 25
%int64_2566 = torch.constant.int 64
%3329 = torch.prim.ListConstruct %int1_2563, %int7_2564, %int25_2565, %int64_2566 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3330 = torch.aten.reshape %3319#2, %3329 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_2567 = torch.constant.int 1
%int2_2568 = torch.constant.int 2
%3331 = torch.aten.transpose.int %3330, %int1_2567, %int2_2568 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_2569 = torch.constant.int 1
%int2_2570 = torch.constant.int 2
%3332 = torch.aten.transpose.int %3326, %int1_2569, %int2_2570 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_2571 = torch.constant.int 2
%int3_2572 = torch.constant.int 3
%3333 = torch.aten.transpose.int %3332, %int2_2571, %int3_2572 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%3334 = torch.aten.matmul %3323, %3333 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%3335 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%3336 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%3337 = torch.aten.pow.Tensor_Tensor %3335, %3336 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%3338 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_2573 = torch.constant.int 0
%3339 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_2574 = torch.constant.none
%float0.000000e00_2575 = torch.constant.float 0.000000e+00
%3340 = torch.aten.full %3339, %float0.000000e00_2575, %none_2574, %none_2574, %none_2574, %none_2574 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_2576 = torch.constant.int 1
%3341 = torch.aten.add.Tensor %3340, %3337, %int1_2576 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%3342 = torch.aten.div.Tensor %3334, %3341 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%3343 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6_2577 = torch.constant.int 6
%none_2578 = torch.constant.none
%false_2579 = torch.constant.bool false
%3344 = torch.aten.to.dtype %3342, %int6_2577, %false_2579, %false_2579, %none_2578 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%3345 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%3346 = torch.aten.where.self %3343, %3344, %3345 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_2580 = torch.constant.int 3
%none_2581 = torch.constant.none
%3347 = torch.aten.softmax.int %3346, %int3_2580, %none_2581 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_2582 = torch.constant.int 6
%none_2583 = torch.constant.none
%false_2584 = torch.constant.bool false
%3348 = torch.aten.to.dtype %3347, %int6_2582, %false_2584, %false_2584, %none_2583 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%3349 = torch.aten.matmul %3348, %3331 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_2585 = torch.constant.int 1
%int2_2586 = torch.constant.int 2
%3350 = torch.aten.transpose.int %3349, %int1_2585, %int2_2586 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%3351 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2587 = torch.constant.int 1
%int7_2588 = torch.constant.int 7
%int1600_2589 = torch.constant.int 1600
%3352 = torch.prim.ListConstruct %int1_2587, %int7_2588, %int1600_2589 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3353 = torch.aten.reshape %3350, %3352 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%3354 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2590 = torch.constant.int 7
%int1600_2591 = torch.constant.int 1600
%3355 = torch.prim.ListConstruct %int7_2590, %int1600_2591 : (!torch.int, !torch.int) -> !torch.list<int>
%3356 = torch.aten.reshape %3353, %3355 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_2592 = torch.constant.int 0
%int1_2593 = torch.constant.int 1
%3357 = torch.aten.mm %3356, %378 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%3358 = torch.aten.add.Tensor %3357, %379, %int1_2593 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%3359 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2594 = torch.constant.int 1
%int7_2595 = torch.constant.int 7
%int1600_2596 = torch.constant.int 1600
%3360 = torch.prim.ListConstruct %int1_2594, %int7_2595, %int1600_2596 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3361 = torch.aten.reshape %3358, %3360 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_2597 = torch.constant.int 1
%3362 = torch.aten.add.Tensor %3361, %3306, %int1_2597 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_2598 = torch.constant.float 9.9999997473787516E-6
%int1600_2599 = torch.constant.int 1600
%3363 = torch.prim.ListConstruct %int1600_2599 : (!torch.int) -> !torch.list<int>
%result0_2600, %result1_2601, %result2_2602 = torch.aten.native_layer_norm %3362, %3363, %380, %381, %float9.999990e-06_2598 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%3364 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2603 = torch.constant.int 7
%int1600_2604 = torch.constant.int 1600
%3365 = torch.prim.ListConstruct %int7_2603, %int1600_2604 : (!torch.int, !torch.int) -> !torch.list<int>
%3366 = torch.aten.reshape %result0_2600, %3365 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_2605 = torch.constant.int 0
%int1_2606 = torch.constant.int 1
%3367 = torch.aten.mm %3366, %382 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%3368 = torch.aten.add.Tensor %3367, %383, %int1_2606 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%3369 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2607 = torch.constant.int 1
%int7_2608 = torch.constant.int 7
%int6400_2609 = torch.constant.int 6400
%3370 = torch.prim.ListConstruct %int1_2607, %int7_2608, %int6400_2609 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3371 = torch.aten.reshape %3368, %3370 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%3372 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%3373 = torch.aten.mul.Tensor %3371, %3372 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%3374 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%3375 = torch.aten.pow.Tensor_Tensor %3371, %3374 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%3376 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%3377 = torch.aten.mul.Tensor %3375, %3376 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_2610 = torch.constant.int 1
%3378 = torch.aten.add.Tensor %3371, %3377, %int1_2610 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%3379 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%3380 = torch.aten.mul.Tensor %3378, %3379 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%3381 = torch.aten.tanh %3380 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%3382 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_2611 = torch.constant.int 1
%3383 = torch.aten.add.Tensor %3381, %3382, %int1_2611 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%3384 = torch.aten.mul.Tensor %3373, %3383 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%3385 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2612 = torch.constant.int 7
%int6400_2613 = torch.constant.int 6400
%3386 = torch.prim.ListConstruct %int7_2612, %int6400_2613 : (!torch.int, !torch.int) -> !torch.list<int>
%3387 = torch.aten.reshape %3384, %3386 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_2614 = torch.constant.int 0
%int1_2615 = torch.constant.int 1
%3388 = torch.aten.mm %3387, %384 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%3389 = torch.aten.add.Tensor %3388, %385, %int1_2615 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%3390 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2616 = torch.constant.int 1
%int7_2617 = torch.constant.int 7
%int1600_2618 = torch.constant.int 1600
%3391 = torch.prim.ListConstruct %int1_2616, %int7_2617, %int1600_2618 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3392 = torch.aten.reshape %3389, %3391 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_2619 = torch.constant.int 1
%3393 = torch.aten.add.Tensor %3362, %3392, %int1_2619 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_2620 = torch.constant.float 9.9999997473787516E-6
%int1600_2621 = torch.constant.int 1600
%3394 = torch.prim.ListConstruct %int1600_2621 : (!torch.int) -> !torch.list<int>
%result0_2622, %result1_2623, %result2_2624 = torch.aten.native_layer_norm %3393, %3394, %386, %387, %float9.999990e-06_2620 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%3395 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2625 = torch.constant.int 7
%int1600_2626 = torch.constant.int 1600
%3396 = torch.prim.ListConstruct %int7_2625, %int1600_2626 : (!torch.int, !torch.int) -> !torch.list<int>
%3397 = torch.aten.reshape %result0_2622, %3396 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_2627 = torch.constant.int 0
%int1_2628 = torch.constant.int 1
%3398 = torch.aten.mm %3397, %388 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%3399 = torch.aten.add.Tensor %3398, %389, %int1_2628 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%3400 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2629 = torch.constant.int 1
%int7_2630 = torch.constant.int 7
%int4800_2631 = torch.constant.int 4800
%3401 = torch.prim.ListConstruct %int1_2629, %int7_2630, %int4800_2631 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3402 = torch.aten.reshape %3399, %3401 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%3403 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%3404 = torch.prim.tolist(%3403) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2_2632 = torch.constant.int 2
%3405 = torch.aten.split_with_sizes %3402, %3404, %int2_2632 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%3406:3 = torch.prim.ListUnpack %3405 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%3407 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_2633 = torch.constant.int 1
%int7_2634 = torch.constant.int 7
%int25_2635 = torch.constant.int 25
%int64_2636 = torch.constant.int 64
%3408 = torch.prim.ListConstruct %int1_2633, %int7_2634, %int25_2635, %int64_2636 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3409 = torch.aten.reshape %3406#0, %3408 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_2637 = torch.constant.int 1
%int2_2638 = torch.constant.int 2
%3410 = torch.aten.transpose.int %3409, %int1_2637, %int2_2638 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%3411 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_2639 = torch.constant.int 1
%int7_2640 = torch.constant.int 7
%int25_2641 = torch.constant.int 25
%int64_2642 = torch.constant.int 64
%3412 = torch.prim.ListConstruct %int1_2639, %int7_2640, %int25_2641, %int64_2642 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3413 = torch.aten.reshape %3406#1, %3412 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_2643 = torch.constant.int 1
%int2_2644 = torch.constant.int 2
%3414 = torch.aten.transpose.int %3413, %int1_2643, %int2_2644 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%3415 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_2645 = torch.constant.int 1
%int7_2646 = torch.constant.int 7
%int25_2647 = torch.constant.int 25
%int64_2648 = torch.constant.int 64
%3416 = torch.prim.ListConstruct %int1_2645, %int7_2646, %int25_2647, %int64_2648 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3417 = torch.aten.reshape %3406#2, %3416 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_2649 = torch.constant.int 1
%int2_2650 = torch.constant.int 2
%3418 = torch.aten.transpose.int %3417, %int1_2649, %int2_2650 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_2651 = torch.constant.int 1
%int2_2652 = torch.constant.int 2
%3419 = torch.aten.transpose.int %3413, %int1_2651, %int2_2652 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_2653 = torch.constant.int 2
%int3_2654 = torch.constant.int 3
%3420 = torch.aten.transpose.int %3419, %int2_2653, %int3_2654 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%3421 = torch.aten.matmul %3410, %3420 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%3422 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%3423 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%3424 = torch.aten.pow.Tensor_Tensor %3422, %3423 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%3425 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_2655 = torch.constant.int 0
%3426 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_2656 = torch.constant.none
%float0.000000e00_2657 = torch.constant.float 0.000000e+00
%3427 = torch.aten.full %3426, %float0.000000e00_2657, %none_2656, %none_2656, %none_2656, %none_2656 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_2658 = torch.constant.int 1
%3428 = torch.aten.add.Tensor %3427, %3424, %int1_2658 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%3429 = torch.aten.div.Tensor %3421, %3428 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%3430 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6_2659 = torch.constant.int 6
%none_2660 = torch.constant.none
%false_2661 = torch.constant.bool false
%3431 = torch.aten.to.dtype %3429, %int6_2659, %false_2661, %false_2661, %none_2660 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%3432 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%3433 = torch.aten.where.self %3430, %3431, %3432 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_2662 = torch.constant.int 3
%none_2663 = torch.constant.none
%3434 = torch.aten.softmax.int %3433, %int3_2662, %none_2663 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_2664 = torch.constant.int 6
%none_2665 = torch.constant.none
%false_2666 = torch.constant.bool false
%3435 = torch.aten.to.dtype %3434, %int6_2664, %false_2666, %false_2666, %none_2665 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%3436 = torch.aten.matmul %3435, %3418 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_2667 = torch.constant.int 1
%int2_2668 = torch.constant.int 2
%3437 = torch.aten.transpose.int %3436, %int1_2667, %int2_2668 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%3438 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2669 = torch.constant.int 1
%int7_2670 = torch.constant.int 7
%int1600_2671 = torch.constant.int 1600
%3439 = torch.prim.ListConstruct %int1_2669, %int7_2670, %int1600_2671 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3440 = torch.aten.reshape %3437, %3439 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%3441 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2672 = torch.constant.int 7
%int1600_2673 = torch.constant.int 1600
%3442 = torch.prim.ListConstruct %int7_2672, %int1600_2673 : (!torch.int, !torch.int) -> !torch.list<int>
%3443 = torch.aten.reshape %3440, %3442 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_2674 = torch.constant.int 0
%int1_2675 = torch.constant.int 1
%3444 = torch.aten.mm %3443, %390 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%3445 = torch.aten.add.Tensor %3444, %391, %int1_2675 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%3446 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2676 = torch.constant.int 1
%int7_2677 = torch.constant.int 7
%int1600_2678 = torch.constant.int 1600
%3447 = torch.prim.ListConstruct %int1_2676, %int7_2677, %int1600_2678 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3448 = torch.aten.reshape %3445, %3447 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_2679 = torch.constant.int 1
%3449 = torch.aten.add.Tensor %3448, %3393, %int1_2679 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_2680 = torch.constant.float 9.9999997473787516E-6
%int1600_2681 = torch.constant.int 1600
%3450 = torch.prim.ListConstruct %int1600_2681 : (!torch.int) -> !torch.list<int>
%result0_2682, %result1_2683, %result2_2684 = torch.aten.native_layer_norm %3449, %3450, %392, %393, %float9.999990e-06_2680 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%3451 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2685 = torch.constant.int 7
%int1600_2686 = torch.constant.int 1600
%3452 = torch.prim.ListConstruct %int7_2685, %int1600_2686 : (!torch.int, !torch.int) -> !torch.list<int>
%3453 = torch.aten.reshape %result0_2682, %3452 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_2687 = torch.constant.int 0
%int1_2688 = torch.constant.int 1
%3454 = torch.aten.mm %3453, %394 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%3455 = torch.aten.add.Tensor %3454, %395, %int1_2688 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%3456 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2689 = torch.constant.int 1
%int7_2690 = torch.constant.int 7
%int6400_2691 = torch.constant.int 6400
%3457 = torch.prim.ListConstruct %int1_2689, %int7_2690, %int6400_2691 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3458 = torch.aten.reshape %3455, %3457 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%3459 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%3460 = torch.aten.mul.Tensor %3458, %3459 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%3461 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%3462 = torch.aten.pow.Tensor_Tensor %3458, %3461 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%3463 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%3464 = torch.aten.mul.Tensor %3462, %3463 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_2692 = torch.constant.int 1
%3465 = torch.aten.add.Tensor %3458, %3464, %int1_2692 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%3466 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%3467 = torch.aten.mul.Tensor %3465, %3466 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%3468 = torch.aten.tanh %3467 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%3469 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_2693 = torch.constant.int 1
%3470 = torch.aten.add.Tensor %3468, %3469, %int1_2693 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%3471 = torch.aten.mul.Tensor %3460, %3470 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%3472 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2694 = torch.constant.int 7
%int6400_2695 = torch.constant.int 6400
%3473 = torch.prim.ListConstruct %int7_2694, %int6400_2695 : (!torch.int, !torch.int) -> !torch.list<int>
%3474 = torch.aten.reshape %3471, %3473 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_2696 = torch.constant.int 0
%int1_2697 = torch.constant.int 1
%3475 = torch.aten.mm %3474, %396 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%3476 = torch.aten.add.Tensor %3475, %397, %int1_2697 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%3477 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2698 = torch.constant.int 1
%int7_2699 = torch.constant.int 7
%int1600_2700 = torch.constant.int 1600
%3478 = torch.prim.ListConstruct %int1_2698, %int7_2699, %int1600_2700 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3479 = torch.aten.reshape %3476, %3478 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_2701 = torch.constant.int 1
%3480 = torch.aten.add.Tensor %3449, %3479, %int1_2701 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_2702 = torch.constant.float 9.9999997473787516E-6
%int1600_2703 = torch.constant.int 1600
%3481 = torch.prim.ListConstruct %int1600_2703 : (!torch.int) -> !torch.list<int>
%result0_2704, %result1_2705, %result2_2706 = torch.aten.native_layer_norm %3480, %3481, %398, %399, %float9.999990e-06_2702 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%3482 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2707 = torch.constant.int 7
%int1600_2708 = torch.constant.int 1600
%3483 = torch.prim.ListConstruct %int7_2707, %int1600_2708 : (!torch.int, !torch.int) -> !torch.list<int>
%3484 = torch.aten.reshape %result0_2704, %3483 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_2709 = torch.constant.int 0
%int1_2710 = torch.constant.int 1
%3485 = torch.aten.mm %3484, %400 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%3486 = torch.aten.add.Tensor %3485, %401, %int1_2710 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%3487 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2711 = torch.constant.int 1
%int7_2712 = torch.constant.int 7
%int4800_2713 = torch.constant.int 4800
%3488 = torch.prim.ListConstruct %int1_2711, %int7_2712, %int4800_2713 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3489 = torch.aten.reshape %3486, %3488 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%3490 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%3491 = torch.prim.tolist(%3490) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2_2714 = torch.constant.int 2
%3492 = torch.aten.split_with_sizes %3489, %3491, %int2_2714 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%3493:3 = torch.prim.ListUnpack %3492 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%3494 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_2715 = torch.constant.int 1
%int7_2716 = torch.constant.int 7
%int25_2717 = torch.constant.int 25
%int64_2718 = torch.constant.int 64
%3495 = torch.prim.ListConstruct %int1_2715, %int7_2716, %int25_2717, %int64_2718 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3496 = torch.aten.reshape %3493#0, %3495 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_2719 = torch.constant.int 1
%int2_2720 = torch.constant.int 2
%3497 = torch.aten.transpose.int %3496, %int1_2719, %int2_2720 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%3498 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_2721 = torch.constant.int 1
%int7_2722 = torch.constant.int 7
%int25_2723 = torch.constant.int 25
%int64_2724 = torch.constant.int 64
%3499 = torch.prim.ListConstruct %int1_2721, %int7_2722, %int25_2723, %int64_2724 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3500 = torch.aten.reshape %3493#1, %3499 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_2725 = torch.constant.int 1
%int2_2726 = torch.constant.int 2
%3501 = torch.aten.transpose.int %3500, %int1_2725, %int2_2726 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%3502 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_2727 = torch.constant.int 1
%int7_2728 = torch.constant.int 7
%int25_2729 = torch.constant.int 25
%int64_2730 = torch.constant.int 64
%3503 = torch.prim.ListConstruct %int1_2727, %int7_2728, %int25_2729, %int64_2730 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3504 = torch.aten.reshape %3493#2, %3503 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_2731 = torch.constant.int 1
%int2_2732 = torch.constant.int 2
%3505 = torch.aten.transpose.int %3504, %int1_2731, %int2_2732 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_2733 = torch.constant.int 1
%int2_2734 = torch.constant.int 2
%3506 = torch.aten.transpose.int %3500, %int1_2733, %int2_2734 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_2735 = torch.constant.int 2
%int3_2736 = torch.constant.int 3
%3507 = torch.aten.transpose.int %3506, %int2_2735, %int3_2736 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%3508 = torch.aten.matmul %3497, %3507 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%3509 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%3510 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%3511 = torch.aten.pow.Tensor_Tensor %3509, %3510 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%3512 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_2737 = torch.constant.int 0
%3513 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_2738 = torch.constant.none
%float0.000000e00_2739 = torch.constant.float 0.000000e+00
%3514 = torch.aten.full %3513, %float0.000000e00_2739, %none_2738, %none_2738, %none_2738, %none_2738 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_2740 = torch.constant.int 1
%3515 = torch.aten.add.Tensor %3514, %3511, %int1_2740 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%3516 = torch.aten.div.Tensor %3508, %3515 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%3517 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6_2741 = torch.constant.int 6
%none_2742 = torch.constant.none
%false_2743 = torch.constant.bool false
%3518 = torch.aten.to.dtype %3516, %int6_2741, %false_2743, %false_2743, %none_2742 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%3519 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%3520 = torch.aten.where.self %3517, %3518, %3519 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_2744 = torch.constant.int 3
%none_2745 = torch.constant.none
%3521 = torch.aten.softmax.int %3520, %int3_2744, %none_2745 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_2746 = torch.constant.int 6
%none_2747 = torch.constant.none
%false_2748 = torch.constant.bool false
%3522 = torch.aten.to.dtype %3521, %int6_2746, %false_2748, %false_2748, %none_2747 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%3523 = torch.aten.matmul %3522, %3505 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_2749 = torch.constant.int 1
%int2_2750 = torch.constant.int 2
%3524 = torch.aten.transpose.int %3523, %int1_2749, %int2_2750 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%3525 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2751 = torch.constant.int 1
%int7_2752 = torch.constant.int 7
%int1600_2753 = torch.constant.int 1600
%3526 = torch.prim.ListConstruct %int1_2751, %int7_2752, %int1600_2753 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3527 = torch.aten.reshape %3524, %3526 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%3528 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2754 = torch.constant.int 7
%int1600_2755 = torch.constant.int 1600
%3529 = torch.prim.ListConstruct %int7_2754, %int1600_2755 : (!torch.int, !torch.int) -> !torch.list<int>
%3530 = torch.aten.reshape %3527, %3529 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_2756 = torch.constant.int 0
%int1_2757 = torch.constant.int 1
%3531 = torch.aten.mm %3530, %402 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%3532 = torch.aten.add.Tensor %3531, %403, %int1_2757 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%3533 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2758 = torch.constant.int 1
%int7_2759 = torch.constant.int 7
%int1600_2760 = torch.constant.int 1600
%3534 = torch.prim.ListConstruct %int1_2758, %int7_2759, %int1600_2760 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3535 = torch.aten.reshape %3532, %3534 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_2761 = torch.constant.int 1
%3536 = torch.aten.add.Tensor %3535, %3480, %int1_2761 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_2762 = torch.constant.float 9.9999997473787516E-6
%int1600_2763 = torch.constant.int 1600
%3537 = torch.prim.ListConstruct %int1600_2763 : (!torch.int) -> !torch.list<int>
%result0_2764, %result1_2765, %result2_2766 = torch.aten.native_layer_norm %3536, %3537, %404, %405, %float9.999990e-06_2762 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%3538 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2767 = torch.constant.int 7
%int1600_2768 = torch.constant.int 1600
%3539 = torch.prim.ListConstruct %int7_2767, %int1600_2768 : (!torch.int, !torch.int) -> !torch.list<int>
%3540 = torch.aten.reshape %result0_2764, %3539 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_2769 = torch.constant.int 0
%int1_2770 = torch.constant.int 1
%3541 = torch.aten.mm %3540, %406 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%3542 = torch.aten.add.Tensor %3541, %407, %int1_2770 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%3543 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2771 = torch.constant.int 1
%int7_2772 = torch.constant.int 7
%int6400_2773 = torch.constant.int 6400
%3544 = torch.prim.ListConstruct %int1_2771, %int7_2772, %int6400_2773 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3545 = torch.aten.reshape %3542, %3544 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%3546 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%3547 = torch.aten.mul.Tensor %3545, %3546 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%3548 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%3549 = torch.aten.pow.Tensor_Tensor %3545, %3548 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%3550 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%3551 = torch.aten.mul.Tensor %3549, %3550 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_2774 = torch.constant.int 1
%3552 = torch.aten.add.Tensor %3545, %3551, %int1_2774 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%3553 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%3554 = torch.aten.mul.Tensor %3552, %3553 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%3555 = torch.aten.tanh %3554 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%3556 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_2775 = torch.constant.int 1
%3557 = torch.aten.add.Tensor %3555, %3556, %int1_2775 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%3558 = torch.aten.mul.Tensor %3547, %3557 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%3559 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2776 = torch.constant.int 7
%int6400_2777 = torch.constant.int 6400
%3560 = torch.prim.ListConstruct %int7_2776, %int6400_2777 : (!torch.int, !torch.int) -> !torch.list<int>
%3561 = torch.aten.reshape %3558, %3560 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_2778 = torch.constant.int 0
%int1_2779 = torch.constant.int 1
%3562 = torch.aten.mm %3561, %408 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%3563 = torch.aten.add.Tensor %3562, %409, %int1_2779 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%3564 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2780 = torch.constant.int 1
%int7_2781 = torch.constant.int 7
%int1600_2782 = torch.constant.int 1600
%3565 = torch.prim.ListConstruct %int1_2780, %int7_2781, %int1600_2782 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3566 = torch.aten.reshape %3563, %3565 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_2783 = torch.constant.int 1
%3567 = torch.aten.add.Tensor %3536, %3566, %int1_2783 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_2784 = torch.constant.float 9.9999997473787516E-6
%int1600_2785 = torch.constant.int 1600
%3568 = torch.prim.ListConstruct %int1600_2785 : (!torch.int) -> !torch.list<int>
%result0_2786, %result1_2787, %result2_2788 = torch.aten.native_layer_norm %3567, %3568, %410, %411, %float9.999990e-06_2784 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%3569 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2789 = torch.constant.int 7
%int1600_2790 = torch.constant.int 1600
%3570 = torch.prim.ListConstruct %int7_2789, %int1600_2790 : (!torch.int, !torch.int) -> !torch.list<int>
%3571 = torch.aten.reshape %result0_2786, %3570 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_2791 = torch.constant.int 0
%int1_2792 = torch.constant.int 1
%3572 = torch.aten.mm %3571, %412 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%3573 = torch.aten.add.Tensor %3572, %413, %int1_2792 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%3574 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2793 = torch.constant.int 1
%int7_2794 = torch.constant.int 7
%int4800_2795 = torch.constant.int 4800
%3575 = torch.prim.ListConstruct %int1_2793, %int7_2794, %int4800_2795 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3576 = torch.aten.reshape %3573, %3575 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%3577 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%3578 = torch.prim.tolist(%3577) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2_2796 = torch.constant.int 2
%3579 = torch.aten.split_with_sizes %3576, %3578, %int2_2796 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%3580:3 = torch.prim.ListUnpack %3579 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%3581 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_2797 = torch.constant.int 1
%int7_2798 = torch.constant.int 7
%int25_2799 = torch.constant.int 25
%int64_2800 = torch.constant.int 64
%3582 = torch.prim.ListConstruct %int1_2797, %int7_2798, %int25_2799, %int64_2800 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3583 = torch.aten.reshape %3580#0, %3582 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_2801 = torch.constant.int 1
%int2_2802 = torch.constant.int 2
%3584 = torch.aten.transpose.int %3583, %int1_2801, %int2_2802 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%3585 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_2803 = torch.constant.int 1
%int7_2804 = torch.constant.int 7
%int25_2805 = torch.constant.int 25
%int64_2806 = torch.constant.int 64
%3586 = torch.prim.ListConstruct %int1_2803, %int7_2804, %int25_2805, %int64_2806 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3587 = torch.aten.reshape %3580#1, %3586 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_2807 = torch.constant.int 1
%int2_2808 = torch.constant.int 2
%3588 = torch.aten.transpose.int %3587, %int1_2807, %int2_2808 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%3589 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_2809 = torch.constant.int 1
%int7_2810 = torch.constant.int 7
%int25_2811 = torch.constant.int 25
%int64_2812 = torch.constant.int 64
%3590 = torch.prim.ListConstruct %int1_2809, %int7_2810, %int25_2811, %int64_2812 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3591 = torch.aten.reshape %3580#2, %3590 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_2813 = torch.constant.int 1
%int2_2814 = torch.constant.int 2
%3592 = torch.aten.transpose.int %3591, %int1_2813, %int2_2814 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_2815 = torch.constant.int 1
%int2_2816 = torch.constant.int 2
%3593 = torch.aten.transpose.int %3587, %int1_2815, %int2_2816 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_2817 = torch.constant.int 2
%int3_2818 = torch.constant.int 3
%3594 = torch.aten.transpose.int %3593, %int2_2817, %int3_2818 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%3595 = torch.aten.matmul %3584, %3594 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%3596 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%3597 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%3598 = torch.aten.pow.Tensor_Tensor %3596, %3597 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%3599 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_2819 = torch.constant.int 0
%3600 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_2820 = torch.constant.none
%float0.000000e00_2821 = torch.constant.float 0.000000e+00
%3601 = torch.aten.full %3600, %float0.000000e00_2821, %none_2820, %none_2820, %none_2820, %none_2820 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_2822 = torch.constant.int 1
%3602 = torch.aten.add.Tensor %3601, %3598, %int1_2822 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%3603 = torch.aten.div.Tensor %3595, %3602 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%3604 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6_2823 = torch.constant.int 6
%none_2824 = torch.constant.none
%false_2825 = torch.constant.bool false
%3605 = torch.aten.to.dtype %3603, %int6_2823, %false_2825, %false_2825, %none_2824 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%3606 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%3607 = torch.aten.where.self %3604, %3605, %3606 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_2826 = torch.constant.int 3
%none_2827 = torch.constant.none
%3608 = torch.aten.softmax.int %3607, %int3_2826, %none_2827 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_2828 = torch.constant.int 6
%none_2829 = torch.constant.none
%false_2830 = torch.constant.bool false
%3609 = torch.aten.to.dtype %3608, %int6_2828, %false_2830, %false_2830, %none_2829 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%3610 = torch.aten.matmul %3609, %3592 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_2831 = torch.constant.int 1
%int2_2832 = torch.constant.int 2
%3611 = torch.aten.transpose.int %3610, %int1_2831, %int2_2832 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%3612 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2833 = torch.constant.int 1
%int7_2834 = torch.constant.int 7
%int1600_2835 = torch.constant.int 1600
%3613 = torch.prim.ListConstruct %int1_2833, %int7_2834, %int1600_2835 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3614 = torch.aten.reshape %3611, %3613 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%3615 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2836 = torch.constant.int 7
%int1600_2837 = torch.constant.int 1600
%3616 = torch.prim.ListConstruct %int7_2836, %int1600_2837 : (!torch.int, !torch.int) -> !torch.list<int>
%3617 = torch.aten.reshape %3614, %3616 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_2838 = torch.constant.int 0
%int1_2839 = torch.constant.int 1
%3618 = torch.aten.mm %3617, %414 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%3619 = torch.aten.add.Tensor %3618, %415, %int1_2839 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%3620 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2840 = torch.constant.int 1
%int7_2841 = torch.constant.int 7
%int1600_2842 = torch.constant.int 1600
%3621 = torch.prim.ListConstruct %int1_2840, %int7_2841, %int1600_2842 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3622 = torch.aten.reshape %3619, %3621 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_2843 = torch.constant.int 1
%3623 = torch.aten.add.Tensor %3622, %3567, %int1_2843 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_2844 = torch.constant.float 9.9999997473787516E-6
%int1600_2845 = torch.constant.int 1600
%3624 = torch.prim.ListConstruct %int1600_2845 : (!torch.int) -> !torch.list<int>
%result0_2846, %result1_2847, %result2_2848 = torch.aten.native_layer_norm %3623, %3624, %416, %417, %float9.999990e-06_2844 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%3625 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2849 = torch.constant.int 7
%int1600_2850 = torch.constant.int 1600
%3626 = torch.prim.ListConstruct %int7_2849, %int1600_2850 : (!torch.int, !torch.int) -> !torch.list<int>
%3627 = torch.aten.reshape %result0_2846, %3626 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_2851 = torch.constant.int 0
%int1_2852 = torch.constant.int 1
%3628 = torch.aten.mm %3627, %418 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%3629 = torch.aten.add.Tensor %3628, %419, %int1_2852 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%3630 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2853 = torch.constant.int 1
%int7_2854 = torch.constant.int 7
%int6400_2855 = torch.constant.int 6400
%3631 = torch.prim.ListConstruct %int1_2853, %int7_2854, %int6400_2855 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3632 = torch.aten.reshape %3629, %3631 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%3633 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%3634 = torch.aten.mul.Tensor %3632, %3633 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%3635 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%3636 = torch.aten.pow.Tensor_Tensor %3632, %3635 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%3637 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%3638 = torch.aten.mul.Tensor %3636, %3637 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_2856 = torch.constant.int 1
%3639 = torch.aten.add.Tensor %3632, %3638, %int1_2856 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%3640 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%3641 = torch.aten.mul.Tensor %3639, %3640 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%3642 = torch.aten.tanh %3641 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%3643 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_2857 = torch.constant.int 1
%3644 = torch.aten.add.Tensor %3642, %3643, %int1_2857 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%3645 = torch.aten.mul.Tensor %3634, %3644 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%3646 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2858 = torch.constant.int 7
%int6400_2859 = torch.constant.int 6400
%3647 = torch.prim.ListConstruct %int7_2858, %int6400_2859 : (!torch.int, !torch.int) -> !torch.list<int>
%3648 = torch.aten.reshape %3645, %3647 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_2860 = torch.constant.int 0
%int1_2861 = torch.constant.int 1
%3649 = torch.aten.mm %3648, %420 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%3650 = torch.aten.add.Tensor %3649, %421, %int1_2861 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%3651 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2862 = torch.constant.int 1
%int7_2863 = torch.constant.int 7
%int1600_2864 = torch.constant.int 1600
%3652 = torch.prim.ListConstruct %int1_2862, %int7_2863, %int1600_2864 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3653 = torch.aten.reshape %3650, %3652 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_2865 = torch.constant.int 1
%3654 = torch.aten.add.Tensor %3623, %3653, %int1_2865 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_2866 = torch.constant.float 9.9999997473787516E-6
%int1600_2867 = torch.constant.int 1600
%3655 = torch.prim.ListConstruct %int1600_2867 : (!torch.int) -> !torch.list<int>
%result0_2868, %result1_2869, %result2_2870 = torch.aten.native_layer_norm %3654, %3655, %422, %423, %float9.999990e-06_2866 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%3656 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2871 = torch.constant.int 7
%int1600_2872 = torch.constant.int 1600
%3657 = torch.prim.ListConstruct %int7_2871, %int1600_2872 : (!torch.int, !torch.int) -> !torch.list<int>
%3658 = torch.aten.reshape %result0_2868, %3657 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_2873 = torch.constant.int 0
%int1_2874 = torch.constant.int 1
%3659 = torch.aten.mm %3658, %424 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%3660 = torch.aten.add.Tensor %3659, %425, %int1_2874 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%3661 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2875 = torch.constant.int 1
%int7_2876 = torch.constant.int 7
%int4800_2877 = torch.constant.int 4800
%3662 = torch.prim.ListConstruct %int1_2875, %int7_2876, %int4800_2877 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3663 = torch.aten.reshape %3660, %3662 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%3664 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%3665 = torch.prim.tolist(%3664) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2_2878 = torch.constant.int 2
%3666 = torch.aten.split_with_sizes %3663, %3665, %int2_2878 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%3667:3 = torch.prim.ListUnpack %3666 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%3668 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_2879 = torch.constant.int 1
%int7_2880 = torch.constant.int 7
%int25_2881 = torch.constant.int 25
%int64_2882 = torch.constant.int 64
%3669 = torch.prim.ListConstruct %int1_2879, %int7_2880, %int25_2881, %int64_2882 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3670 = torch.aten.reshape %3667#0, %3669 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_2883 = torch.constant.int 1
%int2_2884 = torch.constant.int 2
%3671 = torch.aten.transpose.int %3670, %int1_2883, %int2_2884 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%3672 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_2885 = torch.constant.int 1
%int7_2886 = torch.constant.int 7
%int25_2887 = torch.constant.int 25
%int64_2888 = torch.constant.int 64
%3673 = torch.prim.ListConstruct %int1_2885, %int7_2886, %int25_2887, %int64_2888 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3674 = torch.aten.reshape %3667#1, %3673 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_2889 = torch.constant.int 1
%int2_2890 = torch.constant.int 2
%3675 = torch.aten.transpose.int %3674, %int1_2889, %int2_2890 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%3676 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_2891 = torch.constant.int 1
%int7_2892 = torch.constant.int 7
%int25_2893 = torch.constant.int 25
%int64_2894 = torch.constant.int 64
%3677 = torch.prim.ListConstruct %int1_2891, %int7_2892, %int25_2893, %int64_2894 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3678 = torch.aten.reshape %3667#2, %3677 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_2895 = torch.constant.int 1
%int2_2896 = torch.constant.int 2
%3679 = torch.aten.transpose.int %3678, %int1_2895, %int2_2896 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_2897 = torch.constant.int 1
%int2_2898 = torch.constant.int 2
%3680 = torch.aten.transpose.int %3674, %int1_2897, %int2_2898 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_2899 = torch.constant.int 2
%int3_2900 = torch.constant.int 3
%3681 = torch.aten.transpose.int %3680, %int2_2899, %int3_2900 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%3682 = torch.aten.matmul %3671, %3681 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%3683 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%3684 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%3685 = torch.aten.pow.Tensor_Tensor %3683, %3684 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%3686 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_2901 = torch.constant.int 0
%3687 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_2902 = torch.constant.none
%float0.000000e00_2903 = torch.constant.float 0.000000e+00
%3688 = torch.aten.full %3687, %float0.000000e00_2903, %none_2902, %none_2902, %none_2902, %none_2902 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_2904 = torch.constant.int 1
%3689 = torch.aten.add.Tensor %3688, %3685, %int1_2904 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%3690 = torch.aten.div.Tensor %3682, %3689 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%3691 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6_2905 = torch.constant.int 6
%none_2906 = torch.constant.none
%false_2907 = torch.constant.bool false
%3692 = torch.aten.to.dtype %3690, %int6_2905, %false_2907, %false_2907, %none_2906 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%3693 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%3694 = torch.aten.where.self %3691, %3692, %3693 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_2908 = torch.constant.int 3
%none_2909 = torch.constant.none
%3695 = torch.aten.softmax.int %3694, %int3_2908, %none_2909 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_2910 = torch.constant.int 6
%none_2911 = torch.constant.none
%false_2912 = torch.constant.bool false
%3696 = torch.aten.to.dtype %3695, %int6_2910, %false_2912, %false_2912, %none_2911 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%3697 = torch.aten.matmul %3696, %3679 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_2913 = torch.constant.int 1
%int2_2914 = torch.constant.int 2
%3698 = torch.aten.transpose.int %3697, %int1_2913, %int2_2914 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%3699 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2915 = torch.constant.int 1
%int7_2916 = torch.constant.int 7
%int1600_2917 = torch.constant.int 1600
%3700 = torch.prim.ListConstruct %int1_2915, %int7_2916, %int1600_2917 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3701 = torch.aten.reshape %3698, %3700 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%3702 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2918 = torch.constant.int 7
%int1600_2919 = torch.constant.int 1600
%3703 = torch.prim.ListConstruct %int7_2918, %int1600_2919 : (!torch.int, !torch.int) -> !torch.list<int>
%3704 = torch.aten.reshape %3701, %3703 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_2920 = torch.constant.int 0
%int1_2921 = torch.constant.int 1
%3705 = torch.aten.mm %3704, %426 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%3706 = torch.aten.add.Tensor %3705, %427, %int1_2921 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%3707 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2922 = torch.constant.int 1
%int7_2923 = torch.constant.int 7
%int1600_2924 = torch.constant.int 1600
%3708 = torch.prim.ListConstruct %int1_2922, %int7_2923, %int1600_2924 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3709 = torch.aten.reshape %3706, %3708 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_2925 = torch.constant.int 1
%3710 = torch.aten.add.Tensor %3709, %3654, %int1_2925 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_2926 = torch.constant.float 9.9999997473787516E-6
%int1600_2927 = torch.constant.int 1600
%3711 = torch.prim.ListConstruct %int1600_2927 : (!torch.int) -> !torch.list<int>
%result0_2928, %result1_2929, %result2_2930 = torch.aten.native_layer_norm %3710, %3711, %428, %429, %float9.999990e-06_2926 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%3712 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2931 = torch.constant.int 7
%int1600_2932 = torch.constant.int 1600
%3713 = torch.prim.ListConstruct %int7_2931, %int1600_2932 : (!torch.int, !torch.int) -> !torch.list<int>
%3714 = torch.aten.reshape %result0_2928, %3713 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_2933 = torch.constant.int 0
%int1_2934 = torch.constant.int 1
%3715 = torch.aten.mm %3714, %430 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%3716 = torch.aten.add.Tensor %3715, %431, %int1_2934 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%3717 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2935 = torch.constant.int 1
%int7_2936 = torch.constant.int 7
%int6400_2937 = torch.constant.int 6400
%3718 = torch.prim.ListConstruct %int1_2935, %int7_2936, %int6400_2937 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3719 = torch.aten.reshape %3716, %3718 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%3720 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%3721 = torch.aten.mul.Tensor %3719, %3720 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%3722 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%3723 = torch.aten.pow.Tensor_Tensor %3719, %3722 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%3724 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%3725 = torch.aten.mul.Tensor %3723, %3724 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_2938 = torch.constant.int 1
%3726 = torch.aten.add.Tensor %3719, %3725, %int1_2938 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%3727 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%3728 = torch.aten.mul.Tensor %3726, %3727 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%3729 = torch.aten.tanh %3728 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%3730 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_2939 = torch.constant.int 1
%3731 = torch.aten.add.Tensor %3729, %3730, %int1_2939 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%3732 = torch.aten.mul.Tensor %3721, %3731 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%3733 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2940 = torch.constant.int 7
%int6400_2941 = torch.constant.int 6400
%3734 = torch.prim.ListConstruct %int7_2940, %int6400_2941 : (!torch.int, !torch.int) -> !torch.list<int>
%3735 = torch.aten.reshape %3732, %3734 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_2942 = torch.constant.int 0
%int1_2943 = torch.constant.int 1
%3736 = torch.aten.mm %3735, %432 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%3737 = torch.aten.add.Tensor %3736, %433, %int1_2943 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%3738 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2944 = torch.constant.int 1
%int7_2945 = torch.constant.int 7
%int1600_2946 = torch.constant.int 1600
%3739 = torch.prim.ListConstruct %int1_2944, %int7_2945, %int1600_2946 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3740 = torch.aten.reshape %3737, %3739 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_2947 = torch.constant.int 1
%3741 = torch.aten.add.Tensor %3710, %3740, %int1_2947 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_2948 = torch.constant.float 9.9999997473787516E-6
%int1600_2949 = torch.constant.int 1600
%3742 = torch.prim.ListConstruct %int1600_2949 : (!torch.int) -> !torch.list<int>
%result0_2950, %result1_2951, %result2_2952 = torch.aten.native_layer_norm %3741, %3742, %434, %435, %float9.999990e-06_2948 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%3743 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_2953 = torch.constant.int 7
%int1600_2954 = torch.constant.int 1600
%3744 = torch.prim.ListConstruct %int7_2953, %int1600_2954 : (!torch.int, !torch.int) -> !torch.list<int>
%3745 = torch.aten.reshape %result0_2950, %3744 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_2955 = torch.constant.int 0
%int1_2956 = torch.constant.int 1
%3746 = torch.aten.mm %3745, %436 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%3747 = torch.aten.add.Tensor %3746, %437, %int1_2956 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%3748 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2957 = torch.constant.int 1
%int7_2958 = torch.constant.int 7
%int4800_2959 = torch.constant.int 4800
%3749 = torch.prim.ListConstruct %int1_2957, %int7_2958, %int4800_2959 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3750 = torch.aten.reshape %3747, %3749 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%3751 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%3752 = torch.prim.tolist(%3751) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2_2960 = torch.constant.int 2
%3753 = torch.aten.split_with_sizes %3750, %3752, %int2_2960 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%3754:3 = torch.prim.ListUnpack %3753 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%3755 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_2961 = torch.constant.int 1
%int7_2962 = torch.constant.int 7
%int25_2963 = torch.constant.int 25
%int64_2964 = torch.constant.int 64
%3756 = torch.prim.ListConstruct %int1_2961, %int7_2962, %int25_2963, %int64_2964 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3757 = torch.aten.reshape %3754#0, %3756 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_2965 = torch.constant.int 1
%int2_2966 = torch.constant.int 2
%3758 = torch.aten.transpose.int %3757, %int1_2965, %int2_2966 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%3759 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_2967 = torch.constant.int 1
%int7_2968 = torch.constant.int 7
%int25_2969 = torch.constant.int 25
%int64_2970 = torch.constant.int 64
%3760 = torch.prim.ListConstruct %int1_2967, %int7_2968, %int25_2969, %int64_2970 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3761 = torch.aten.reshape %3754#1, %3760 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_2971 = torch.constant.int 1
%int2_2972 = torch.constant.int 2
%3762 = torch.aten.transpose.int %3761, %int1_2971, %int2_2972 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%3763 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_2973 = torch.constant.int 1
%int7_2974 = torch.constant.int 7
%int25_2975 = torch.constant.int 25
%int64_2976 = torch.constant.int 64
%3764 = torch.prim.ListConstruct %int1_2973, %int7_2974, %int25_2975, %int64_2976 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3765 = torch.aten.reshape %3754#2, %3764 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_2977 = torch.constant.int 1
%int2_2978 = torch.constant.int 2
%3766 = torch.aten.transpose.int %3765, %int1_2977, %int2_2978 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_2979 = torch.constant.int 1
%int2_2980 = torch.constant.int 2
%3767 = torch.aten.transpose.int %3761, %int1_2979, %int2_2980 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_2981 = torch.constant.int 2
%int3_2982 = torch.constant.int 3
%3768 = torch.aten.transpose.int %3767, %int2_2981, %int3_2982 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%3769 = torch.aten.matmul %3758, %3768 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%3770 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%3771 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%3772 = torch.aten.pow.Tensor_Tensor %3770, %3771 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%3773 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_2983 = torch.constant.int 0
%3774 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_2984 = torch.constant.none
%float0.000000e00_2985 = torch.constant.float 0.000000e+00
%3775 = torch.aten.full %3774, %float0.000000e00_2985, %none_2984, %none_2984, %none_2984, %none_2984 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_2986 = torch.constant.int 1
%3776 = torch.aten.add.Tensor %3775, %3772, %int1_2986 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%3777 = torch.aten.div.Tensor %3769, %3776 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%3778 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6_2987 = torch.constant.int 6
%none_2988 = torch.constant.none
%false_2989 = torch.constant.bool false
%3779 = torch.aten.to.dtype %3777, %int6_2987, %false_2989, %false_2989, %none_2988 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%3780 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%3781 = torch.aten.where.self %3778, %3779, %3780 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_2990 = torch.constant.int 3
%none_2991 = torch.constant.none
%3782 = torch.aten.softmax.int %3781, %int3_2990, %none_2991 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_2992 = torch.constant.int 6
%none_2993 = torch.constant.none
%false_2994 = torch.constant.bool false
%3783 = torch.aten.to.dtype %3782, %int6_2992, %false_2994, %false_2994, %none_2993 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%3784 = torch.aten.matmul %3783, %3766 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_2995 = torch.constant.int 1
%int2_2996 = torch.constant.int 2
%3785 = torch.aten.transpose.int %3784, %int1_2995, %int2_2996 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%3786 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_2997 = torch.constant.int 1
%int7_2998 = torch.constant.int 7
%int1600_2999 = torch.constant.int 1600
%3787 = torch.prim.ListConstruct %int1_2997, %int7_2998, %int1600_2999 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3788 = torch.aten.reshape %3785, %3787 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%3789 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_3000 = torch.constant.int 7
%int1600_3001 = torch.constant.int 1600
%3790 = torch.prim.ListConstruct %int7_3000, %int1600_3001 : (!torch.int, !torch.int) -> !torch.list<int>
%3791 = torch.aten.reshape %3788, %3790 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_3002 = torch.constant.int 0
%int1_3003 = torch.constant.int 1
%3792 = torch.aten.mm %3791, %438 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%3793 = torch.aten.add.Tensor %3792, %439, %int1_3003 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%3794 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3004 = torch.constant.int 1
%int7_3005 = torch.constant.int 7
%int1600_3006 = torch.constant.int 1600
%3795 = torch.prim.ListConstruct %int1_3004, %int7_3005, %int1600_3006 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3796 = torch.aten.reshape %3793, %3795 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_3007 = torch.constant.int 1
%3797 = torch.aten.add.Tensor %3796, %3741, %int1_3007 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_3008 = torch.constant.float 9.9999997473787516E-6
%int1600_3009 = torch.constant.int 1600
%3798 = torch.prim.ListConstruct %int1600_3009 : (!torch.int) -> !torch.list<int>
%result0_3010, %result1_3011, %result2_3012 = torch.aten.native_layer_norm %3797, %3798, %440, %441, %float9.999990e-06_3008 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%3799 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_3013 = torch.constant.int 7
%int1600_3014 = torch.constant.int 1600
%3800 = torch.prim.ListConstruct %int7_3013, %int1600_3014 : (!torch.int, !torch.int) -> !torch.list<int>
%3801 = torch.aten.reshape %result0_3010, %3800 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_3015 = torch.constant.int 0
%int1_3016 = torch.constant.int 1
%3802 = torch.aten.mm %3801, %442 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%3803 = torch.aten.add.Tensor %3802, %443, %int1_3016 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%3804 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3017 = torch.constant.int 1
%int7_3018 = torch.constant.int 7
%int6400_3019 = torch.constant.int 6400
%3805 = torch.prim.ListConstruct %int1_3017, %int7_3018, %int6400_3019 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3806 = torch.aten.reshape %3803, %3805 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%3807 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%3808 = torch.aten.mul.Tensor %3806, %3807 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%3809 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%3810 = torch.aten.pow.Tensor_Tensor %3806, %3809 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%3811 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%3812 = torch.aten.mul.Tensor %3810, %3811 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_3020 = torch.constant.int 1
%3813 = torch.aten.add.Tensor %3806, %3812, %int1_3020 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%3814 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%3815 = torch.aten.mul.Tensor %3813, %3814 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%3816 = torch.aten.tanh %3815 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%3817 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_3021 = torch.constant.int 1
%3818 = torch.aten.add.Tensor %3816, %3817, %int1_3021 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%3819 = torch.aten.mul.Tensor %3808, %3818 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%3820 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_3022 = torch.constant.int 7
%int6400_3023 = torch.constant.int 6400
%3821 = torch.prim.ListConstruct %int7_3022, %int6400_3023 : (!torch.int, !torch.int) -> !torch.list<int>
%3822 = torch.aten.reshape %3819, %3821 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_3024 = torch.constant.int 0
%int1_3025 = torch.constant.int 1
%3823 = torch.aten.mm %3822, %444 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%3824 = torch.aten.add.Tensor %3823, %445, %int1_3025 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%3825 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3026 = torch.constant.int 1
%int7_3027 = torch.constant.int 7
%int1600_3028 = torch.constant.int 1600
%3826 = torch.prim.ListConstruct %int1_3026, %int7_3027, %int1600_3028 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3827 = torch.aten.reshape %3824, %3826 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_3029 = torch.constant.int 1
%3828 = torch.aten.add.Tensor %3797, %3827, %int1_3029 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_3030 = torch.constant.float 9.9999997473787516E-6
%int1600_3031 = torch.constant.int 1600
%3829 = torch.prim.ListConstruct %int1600_3031 : (!torch.int) -> !torch.list<int>
%result0_3032, %result1_3033, %result2_3034 = torch.aten.native_layer_norm %3828, %3829, %446, %447, %float9.999990e-06_3030 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%3830 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_3035 = torch.constant.int 7
%int1600_3036 = torch.constant.int 1600
%3831 = torch.prim.ListConstruct %int7_3035, %int1600_3036 : (!torch.int, !torch.int) -> !torch.list<int>
%3832 = torch.aten.reshape %result0_3032, %3831 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_3037 = torch.constant.int 0
%int1_3038 = torch.constant.int 1
%3833 = torch.aten.mm %3832, %448 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%3834 = torch.aten.add.Tensor %3833, %449, %int1_3038 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%3835 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3039 = torch.constant.int 1
%int7_3040 = torch.constant.int 7
%int4800_3041 = torch.constant.int 4800
%3836 = torch.prim.ListConstruct %int1_3039, %int7_3040, %int4800_3041 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3837 = torch.aten.reshape %3834, %3836 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%3838 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%3839 = torch.prim.tolist(%3838) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2_3042 = torch.constant.int 2
%3840 = torch.aten.split_with_sizes %3837, %3839, %int2_3042 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%3841:3 = torch.prim.ListUnpack %3840 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%3842 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_3043 = torch.constant.int 1
%int7_3044 = torch.constant.int 7
%int25_3045 = torch.constant.int 25
%int64_3046 = torch.constant.int 64
%3843 = torch.prim.ListConstruct %int1_3043, %int7_3044, %int25_3045, %int64_3046 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3844 = torch.aten.reshape %3841#0, %3843 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_3047 = torch.constant.int 1
%int2_3048 = torch.constant.int 2
%3845 = torch.aten.transpose.int %3844, %int1_3047, %int2_3048 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%3846 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_3049 = torch.constant.int 1
%int7_3050 = torch.constant.int 7
%int25_3051 = torch.constant.int 25
%int64_3052 = torch.constant.int 64
%3847 = torch.prim.ListConstruct %int1_3049, %int7_3050, %int25_3051, %int64_3052 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3848 = torch.aten.reshape %3841#1, %3847 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_3053 = torch.constant.int 1
%int2_3054 = torch.constant.int 2
%3849 = torch.aten.transpose.int %3848, %int1_3053, %int2_3054 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%3850 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_3055 = torch.constant.int 1
%int7_3056 = torch.constant.int 7
%int25_3057 = torch.constant.int 25
%int64_3058 = torch.constant.int 64
%3851 = torch.prim.ListConstruct %int1_3055, %int7_3056, %int25_3057, %int64_3058 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3852 = torch.aten.reshape %3841#2, %3851 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_3059 = torch.constant.int 1
%int2_3060 = torch.constant.int 2
%3853 = torch.aten.transpose.int %3852, %int1_3059, %int2_3060 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_3061 = torch.constant.int 1
%int2_3062 = torch.constant.int 2
%3854 = torch.aten.transpose.int %3848, %int1_3061, %int2_3062 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_3063 = torch.constant.int 2
%int3_3064 = torch.constant.int 3
%3855 = torch.aten.transpose.int %3854, %int2_3063, %int3_3064 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%3856 = torch.aten.matmul %3845, %3855 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%3857 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%3858 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%3859 = torch.aten.pow.Tensor_Tensor %3857, %3858 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%3860 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_3065 = torch.constant.int 0
%3861 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_3066 = torch.constant.none
%float0.000000e00_3067 = torch.constant.float 0.000000e+00
%3862 = torch.aten.full %3861, %float0.000000e00_3067, %none_3066, %none_3066, %none_3066, %none_3066 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_3068 = torch.constant.int 1
%3863 = torch.aten.add.Tensor %3862, %3859, %int1_3068 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%3864 = torch.aten.div.Tensor %3856, %3863 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%3865 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6_3069 = torch.constant.int 6
%none_3070 = torch.constant.none
%false_3071 = torch.constant.bool false
%3866 = torch.aten.to.dtype %3864, %int6_3069, %false_3071, %false_3071, %none_3070 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%3867 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%3868 = torch.aten.where.self %3865, %3866, %3867 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_3072 = torch.constant.int 3
%none_3073 = torch.constant.none
%3869 = torch.aten.softmax.int %3868, %int3_3072, %none_3073 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_3074 = torch.constant.int 6
%none_3075 = torch.constant.none
%false_3076 = torch.constant.bool false
%3870 = torch.aten.to.dtype %3869, %int6_3074, %false_3076, %false_3076, %none_3075 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%3871 = torch.aten.matmul %3870, %3853 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_3077 = torch.constant.int 1
%int2_3078 = torch.constant.int 2
%3872 = torch.aten.transpose.int %3871, %int1_3077, %int2_3078 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%3873 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3079 = torch.constant.int 1
%int7_3080 = torch.constant.int 7
%int1600_3081 = torch.constant.int 1600
%3874 = torch.prim.ListConstruct %int1_3079, %int7_3080, %int1600_3081 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3875 = torch.aten.reshape %3872, %3874 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%3876 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_3082 = torch.constant.int 7
%int1600_3083 = torch.constant.int 1600
%3877 = torch.prim.ListConstruct %int7_3082, %int1600_3083 : (!torch.int, !torch.int) -> !torch.list<int>
%3878 = torch.aten.reshape %3875, %3877 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_3084 = torch.constant.int 0
%int1_3085 = torch.constant.int 1
%3879 = torch.aten.mm %3878, %450 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%3880 = torch.aten.add.Tensor %3879, %451, %int1_3085 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%3881 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3086 = torch.constant.int 1
%int7_3087 = torch.constant.int 7
%int1600_3088 = torch.constant.int 1600
%3882 = torch.prim.ListConstruct %int1_3086, %int7_3087, %int1600_3088 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3883 = torch.aten.reshape %3880, %3882 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_3089 = torch.constant.int 1
%3884 = torch.aten.add.Tensor %3883, %3828, %int1_3089 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_3090 = torch.constant.float 9.9999997473787516E-6
%int1600_3091 = torch.constant.int 1600
%3885 = torch.prim.ListConstruct %int1600_3091 : (!torch.int) -> !torch.list<int>
%result0_3092, %result1_3093, %result2_3094 = torch.aten.native_layer_norm %3884, %3885, %452, %453, %float9.999990e-06_3090 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%3886 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_3095 = torch.constant.int 7
%int1600_3096 = torch.constant.int 1600
%3887 = torch.prim.ListConstruct %int7_3095, %int1600_3096 : (!torch.int, !torch.int) -> !torch.list<int>
%3888 = torch.aten.reshape %result0_3092, %3887 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_3097 = torch.constant.int 0
%int1_3098 = torch.constant.int 1
%3889 = torch.aten.mm %3888, %454 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%3890 = torch.aten.add.Tensor %3889, %455, %int1_3098 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%3891 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3099 = torch.constant.int 1
%int7_3100 = torch.constant.int 7
%int6400_3101 = torch.constant.int 6400
%3892 = torch.prim.ListConstruct %int1_3099, %int7_3100, %int6400_3101 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3893 = torch.aten.reshape %3890, %3892 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%3894 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%3895 = torch.aten.mul.Tensor %3893, %3894 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%3896 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%3897 = torch.aten.pow.Tensor_Tensor %3893, %3896 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%3898 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%3899 = torch.aten.mul.Tensor %3897, %3898 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_3102 = torch.constant.int 1
%3900 = torch.aten.add.Tensor %3893, %3899, %int1_3102 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%3901 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%3902 = torch.aten.mul.Tensor %3900, %3901 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%3903 = torch.aten.tanh %3902 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%3904 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_3103 = torch.constant.int 1
%3905 = torch.aten.add.Tensor %3903, %3904, %int1_3103 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%3906 = torch.aten.mul.Tensor %3895, %3905 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%3907 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_3104 = torch.constant.int 7
%int6400_3105 = torch.constant.int 6400
%3908 = torch.prim.ListConstruct %int7_3104, %int6400_3105 : (!torch.int, !torch.int) -> !torch.list<int>
%3909 = torch.aten.reshape %3906, %3908 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_3106 = torch.constant.int 0
%int1_3107 = torch.constant.int 1
%3910 = torch.aten.mm %3909, %456 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%3911 = torch.aten.add.Tensor %3910, %457, %int1_3107 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%3912 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3108 = torch.constant.int 1
%int7_3109 = torch.constant.int 7
%int1600_3110 = torch.constant.int 1600
%3913 = torch.prim.ListConstruct %int1_3108, %int7_3109, %int1600_3110 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3914 = torch.aten.reshape %3911, %3913 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_3111 = torch.constant.int 1
%3915 = torch.aten.add.Tensor %3884, %3914, %int1_3111 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_3112 = torch.constant.float 9.9999997473787516E-6
%int1600_3113 = torch.constant.int 1600
%3916 = torch.prim.ListConstruct %int1600_3113 : (!torch.int) -> !torch.list<int>
%result0_3114, %result1_3115, %result2_3116 = torch.aten.native_layer_norm %3915, %3916, %458, %459, %float9.999990e-06_3112 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%3917 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_3117 = torch.constant.int 7
%int1600_3118 = torch.constant.int 1600
%3918 = torch.prim.ListConstruct %int7_3117, %int1600_3118 : (!torch.int, !torch.int) -> !torch.list<int>
%3919 = torch.aten.reshape %result0_3114, %3918 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_3119 = torch.constant.int 0
%int1_3120 = torch.constant.int 1
%3920 = torch.aten.mm %3919, %460 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%3921 = torch.aten.add.Tensor %3920, %461, %int1_3120 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%3922 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3121 = torch.constant.int 1
%int7_3122 = torch.constant.int 7
%int4800_3123 = torch.constant.int 4800
%3923 = torch.prim.ListConstruct %int1_3121, %int7_3122, %int4800_3123 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3924 = torch.aten.reshape %3921, %3923 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%3925 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%3926 = torch.prim.tolist(%3925) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2_3124 = torch.constant.int 2
%3927 = torch.aten.split_with_sizes %3924, %3926, %int2_3124 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%3928:3 = torch.prim.ListUnpack %3927 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%3929 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_3125 = torch.constant.int 1
%int7_3126 = torch.constant.int 7
%int25_3127 = torch.constant.int 25
%int64_3128 = torch.constant.int 64
%3930 = torch.prim.ListConstruct %int1_3125, %int7_3126, %int25_3127, %int64_3128 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3931 = torch.aten.reshape %3928#0, %3930 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_3129 = torch.constant.int 1
%int2_3130 = torch.constant.int 2
%3932 = torch.aten.transpose.int %3931, %int1_3129, %int2_3130 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%3933 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_3131 = torch.constant.int 1
%int7_3132 = torch.constant.int 7
%int25_3133 = torch.constant.int 25
%int64_3134 = torch.constant.int 64
%3934 = torch.prim.ListConstruct %int1_3131, %int7_3132, %int25_3133, %int64_3134 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3935 = torch.aten.reshape %3928#1, %3934 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_3135 = torch.constant.int 1
%int2_3136 = torch.constant.int 2
%3936 = torch.aten.transpose.int %3935, %int1_3135, %int2_3136 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%3937 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_3137 = torch.constant.int 1
%int7_3138 = torch.constant.int 7
%int25_3139 = torch.constant.int 25
%int64_3140 = torch.constant.int 64
%3938 = torch.prim.ListConstruct %int1_3137, %int7_3138, %int25_3139, %int64_3140 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3939 = torch.aten.reshape %3928#2, %3938 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_3141 = torch.constant.int 1
%int2_3142 = torch.constant.int 2
%3940 = torch.aten.transpose.int %3939, %int1_3141, %int2_3142 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_3143 = torch.constant.int 1
%int2_3144 = torch.constant.int 2
%3941 = torch.aten.transpose.int %3935, %int1_3143, %int2_3144 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_3145 = torch.constant.int 2
%int3_3146 = torch.constant.int 3
%3942 = torch.aten.transpose.int %3941, %int2_3145, %int3_3146 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%3943 = torch.aten.matmul %3932, %3942 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%3944 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%3945 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%3946 = torch.aten.pow.Tensor_Tensor %3944, %3945 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%3947 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_3147 = torch.constant.int 0
%3948 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_3148 = torch.constant.none
%float0.000000e00_3149 = torch.constant.float 0.000000e+00
%3949 = torch.aten.full %3948, %float0.000000e00_3149, %none_3148, %none_3148, %none_3148, %none_3148 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_3150 = torch.constant.int 1
%3950 = torch.aten.add.Tensor %3949, %3946, %int1_3150 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%3951 = torch.aten.div.Tensor %3943, %3950 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%3952 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6_3151 = torch.constant.int 6
%none_3152 = torch.constant.none
%false_3153 = torch.constant.bool false
%3953 = torch.aten.to.dtype %3951, %int6_3151, %false_3153, %false_3153, %none_3152 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%3954 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%3955 = torch.aten.where.self %3952, %3953, %3954 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_3154 = torch.constant.int 3
%none_3155 = torch.constant.none
%3956 = torch.aten.softmax.int %3955, %int3_3154, %none_3155 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_3156 = torch.constant.int 6
%none_3157 = torch.constant.none
%false_3158 = torch.constant.bool false
%3957 = torch.aten.to.dtype %3956, %int6_3156, %false_3158, %false_3158, %none_3157 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%3958 = torch.aten.matmul %3957, %3940 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_3159 = torch.constant.int 1
%int2_3160 = torch.constant.int 2
%3959 = torch.aten.transpose.int %3958, %int1_3159, %int2_3160 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%3960 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3161 = torch.constant.int 1
%int7_3162 = torch.constant.int 7
%int1600_3163 = torch.constant.int 1600
%3961 = torch.prim.ListConstruct %int1_3161, %int7_3162, %int1600_3163 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3962 = torch.aten.reshape %3959, %3961 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%3963 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_3164 = torch.constant.int 7
%int1600_3165 = torch.constant.int 1600
%3964 = torch.prim.ListConstruct %int7_3164, %int1600_3165 : (!torch.int, !torch.int) -> !torch.list<int>
%3965 = torch.aten.reshape %3962, %3964 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_3166 = torch.constant.int 0
%int1_3167 = torch.constant.int 1
%3966 = torch.aten.mm %3965, %462 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%3967 = torch.aten.add.Tensor %3966, %463, %int1_3167 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%3968 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3168 = torch.constant.int 1
%int7_3169 = torch.constant.int 7
%int1600_3170 = torch.constant.int 1600
%3969 = torch.prim.ListConstruct %int1_3168, %int7_3169, %int1600_3170 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3970 = torch.aten.reshape %3967, %3969 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_3171 = torch.constant.int 1
%3971 = torch.aten.add.Tensor %3970, %3915, %int1_3171 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_3172 = torch.constant.float 9.9999997473787516E-6
%int1600_3173 = torch.constant.int 1600
%3972 = torch.prim.ListConstruct %int1600_3173 : (!torch.int) -> !torch.list<int>
%result0_3174, %result1_3175, %result2_3176 = torch.aten.native_layer_norm %3971, %3972, %464, %465, %float9.999990e-06_3172 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%3973 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_3177 = torch.constant.int 7
%int1600_3178 = torch.constant.int 1600
%3974 = torch.prim.ListConstruct %int7_3177, %int1600_3178 : (!torch.int, !torch.int) -> !torch.list<int>
%3975 = torch.aten.reshape %result0_3174, %3974 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_3179 = torch.constant.int 0
%int1_3180 = torch.constant.int 1
%3976 = torch.aten.mm %3975, %466 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%3977 = torch.aten.add.Tensor %3976, %467, %int1_3180 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%3978 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3181 = torch.constant.int 1
%int7_3182 = torch.constant.int 7
%int6400_3183 = torch.constant.int 6400
%3979 = torch.prim.ListConstruct %int1_3181, %int7_3182, %int6400_3183 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%3980 = torch.aten.reshape %3977, %3979 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%3981 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%3982 = torch.aten.mul.Tensor %3980, %3981 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%3983 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%3984 = torch.aten.pow.Tensor_Tensor %3980, %3983 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%3985 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%3986 = torch.aten.mul.Tensor %3984, %3985 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_3184 = torch.constant.int 1
%3987 = torch.aten.add.Tensor %3980, %3986, %int1_3184 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%3988 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%3989 = torch.aten.mul.Tensor %3987, %3988 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%3990 = torch.aten.tanh %3989 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%3991 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_3185 = torch.constant.int 1
%3992 = torch.aten.add.Tensor %3990, %3991, %int1_3185 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%3993 = torch.aten.mul.Tensor %3982, %3992 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%3994 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_3186 = torch.constant.int 7
%int6400_3187 = torch.constant.int 6400
%3995 = torch.prim.ListConstruct %int7_3186, %int6400_3187 : (!torch.int, !torch.int) -> !torch.list<int>
%3996 = torch.aten.reshape %3993, %3995 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_3188 = torch.constant.int 0
%int1_3189 = torch.constant.int 1
%3997 = torch.aten.mm %3996, %468 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%3998 = torch.aten.add.Tensor %3997, %469, %int1_3189 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%3999 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3190 = torch.constant.int 1
%int7_3191 = torch.constant.int 7
%int1600_3192 = torch.constant.int 1600
%4000 = torch.prim.ListConstruct %int1_3190, %int7_3191, %int1600_3192 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4001 = torch.aten.reshape %3998, %4000 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_3193 = torch.constant.int 1
%4002 = torch.aten.add.Tensor %3971, %4001, %int1_3193 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_3194 = torch.constant.float 9.9999997473787516E-6
%int1600_3195 = torch.constant.int 1600
%4003 = torch.prim.ListConstruct %int1600_3195 : (!torch.int) -> !torch.list<int>
%result0_3196, %result1_3197, %result2_3198 = torch.aten.native_layer_norm %4002, %4003, %470, %471, %float9.999990e-06_3194 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%4004 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_3199 = torch.constant.int 7
%int1600_3200 = torch.constant.int 1600
%4005 = torch.prim.ListConstruct %int7_3199, %int1600_3200 : (!torch.int, !torch.int) -> !torch.list<int>
%4006 = torch.aten.reshape %result0_3196, %4005 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_3201 = torch.constant.int 0
%int1_3202 = torch.constant.int 1
%4007 = torch.aten.mm %4006, %472 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%4008 = torch.aten.add.Tensor %4007, %473, %int1_3202 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%4009 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3203 = torch.constant.int 1
%int7_3204 = torch.constant.int 7
%int4800_3205 = torch.constant.int 4800
%4010 = torch.prim.ListConstruct %int1_3203, %int7_3204, %int4800_3205 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4011 = torch.aten.reshape %4008, %4010 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%4012 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%4013 = torch.prim.tolist(%4012) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2_3206 = torch.constant.int 2
%4014 = torch.aten.split_with_sizes %4011, %4013, %int2_3206 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%4015:3 = torch.prim.ListUnpack %4014 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%4016 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_3207 = torch.constant.int 1
%int7_3208 = torch.constant.int 7
%int25_3209 = torch.constant.int 25
%int64_3210 = torch.constant.int 64
%4017 = torch.prim.ListConstruct %int1_3207, %int7_3208, %int25_3209, %int64_3210 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4018 = torch.aten.reshape %4015#0, %4017 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_3211 = torch.constant.int 1
%int2_3212 = torch.constant.int 2
%4019 = torch.aten.transpose.int %4018, %int1_3211, %int2_3212 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%4020 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_3213 = torch.constant.int 1
%int7_3214 = torch.constant.int 7
%int25_3215 = torch.constant.int 25
%int64_3216 = torch.constant.int 64
%4021 = torch.prim.ListConstruct %int1_3213, %int7_3214, %int25_3215, %int64_3216 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4022 = torch.aten.reshape %4015#1, %4021 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_3217 = torch.constant.int 1
%int2_3218 = torch.constant.int 2
%4023 = torch.aten.transpose.int %4022, %int1_3217, %int2_3218 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%4024 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_3219 = torch.constant.int 1
%int7_3220 = torch.constant.int 7
%int25_3221 = torch.constant.int 25
%int64_3222 = torch.constant.int 64
%4025 = torch.prim.ListConstruct %int1_3219, %int7_3220, %int25_3221, %int64_3222 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4026 = torch.aten.reshape %4015#2, %4025 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_3223 = torch.constant.int 1
%int2_3224 = torch.constant.int 2
%4027 = torch.aten.transpose.int %4026, %int1_3223, %int2_3224 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_3225 = torch.constant.int 1
%int2_3226 = torch.constant.int 2
%4028 = torch.aten.transpose.int %4022, %int1_3225, %int2_3226 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_3227 = torch.constant.int 2
%int3_3228 = torch.constant.int 3
%4029 = torch.aten.transpose.int %4028, %int2_3227, %int3_3228 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%4030 = torch.aten.matmul %4019, %4029 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%4031 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%4032 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%4033 = torch.aten.pow.Tensor_Tensor %4031, %4032 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%4034 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_3229 = torch.constant.int 0
%4035 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_3230 = torch.constant.none
%float0.000000e00_3231 = torch.constant.float 0.000000e+00
%4036 = torch.aten.full %4035, %float0.000000e00_3231, %none_3230, %none_3230, %none_3230, %none_3230 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_3232 = torch.constant.int 1
%4037 = torch.aten.add.Tensor %4036, %4033, %int1_3232 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%4038 = torch.aten.div.Tensor %4030, %4037 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%4039 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6_3233 = torch.constant.int 6
%none_3234 = torch.constant.none
%false_3235 = torch.constant.bool false
%4040 = torch.aten.to.dtype %4038, %int6_3233, %false_3235, %false_3235, %none_3234 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%4041 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%4042 = torch.aten.where.self %4039, %4040, %4041 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_3236 = torch.constant.int 3
%none_3237 = torch.constant.none
%4043 = torch.aten.softmax.int %4042, %int3_3236, %none_3237 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_3238 = torch.constant.int 6
%none_3239 = torch.constant.none
%false_3240 = torch.constant.bool false
%4044 = torch.aten.to.dtype %4043, %int6_3238, %false_3240, %false_3240, %none_3239 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%4045 = torch.aten.matmul %4044, %4027 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_3241 = torch.constant.int 1
%int2_3242 = torch.constant.int 2
%4046 = torch.aten.transpose.int %4045, %int1_3241, %int2_3242 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%4047 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3243 = torch.constant.int 1
%int7_3244 = torch.constant.int 7
%int1600_3245 = torch.constant.int 1600
%4048 = torch.prim.ListConstruct %int1_3243, %int7_3244, %int1600_3245 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4049 = torch.aten.reshape %4046, %4048 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%4050 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_3246 = torch.constant.int 7
%int1600_3247 = torch.constant.int 1600
%4051 = torch.prim.ListConstruct %int7_3246, %int1600_3247 : (!torch.int, !torch.int) -> !torch.list<int>
%4052 = torch.aten.reshape %4049, %4051 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_3248 = torch.constant.int 0
%int1_3249 = torch.constant.int 1
%4053 = torch.aten.mm %4052, %474 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%4054 = torch.aten.add.Tensor %4053, %475, %int1_3249 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%4055 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3250 = torch.constant.int 1
%int7_3251 = torch.constant.int 7
%int1600_3252 = torch.constant.int 1600
%4056 = torch.prim.ListConstruct %int1_3250, %int7_3251, %int1600_3252 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4057 = torch.aten.reshape %4054, %4056 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_3253 = torch.constant.int 1
%4058 = torch.aten.add.Tensor %4057, %4002, %int1_3253 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_3254 = torch.constant.float 9.9999997473787516E-6
%int1600_3255 = torch.constant.int 1600
%4059 = torch.prim.ListConstruct %int1600_3255 : (!torch.int) -> !torch.list<int>
%result0_3256, %result1_3257, %result2_3258 = torch.aten.native_layer_norm %4058, %4059, %476, %477, %float9.999990e-06_3254 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%4060 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_3259 = torch.constant.int 7
%int1600_3260 = torch.constant.int 1600
%4061 = torch.prim.ListConstruct %int7_3259, %int1600_3260 : (!torch.int, !torch.int) -> !torch.list<int>
%4062 = torch.aten.reshape %result0_3256, %4061 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_3261 = torch.constant.int 0
%int1_3262 = torch.constant.int 1
%4063 = torch.aten.mm %4062, %478 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%4064 = torch.aten.add.Tensor %4063, %479, %int1_3262 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%4065 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3263 = torch.constant.int 1
%int7_3264 = torch.constant.int 7
%int6400_3265 = torch.constant.int 6400
%4066 = torch.prim.ListConstruct %int1_3263, %int7_3264, %int6400_3265 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4067 = torch.aten.reshape %4064, %4066 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%4068 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%4069 = torch.aten.mul.Tensor %4067, %4068 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%4070 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%4071 = torch.aten.pow.Tensor_Tensor %4067, %4070 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%4072 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%4073 = torch.aten.mul.Tensor %4071, %4072 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_3266 = torch.constant.int 1
%4074 = torch.aten.add.Tensor %4067, %4073, %int1_3266 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%4075 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%4076 = torch.aten.mul.Tensor %4074, %4075 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%4077 = torch.aten.tanh %4076 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%4078 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_3267 = torch.constant.int 1
%4079 = torch.aten.add.Tensor %4077, %4078, %int1_3267 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%4080 = torch.aten.mul.Tensor %4069, %4079 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%4081 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_3268 = torch.constant.int 7
%int6400_3269 = torch.constant.int 6400
%4082 = torch.prim.ListConstruct %int7_3268, %int6400_3269 : (!torch.int, !torch.int) -> !torch.list<int>
%4083 = torch.aten.reshape %4080, %4082 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_3270 = torch.constant.int 0
%int1_3271 = torch.constant.int 1
%4084 = torch.aten.mm %4083, %480 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%4085 = torch.aten.add.Tensor %4084, %481, %int1_3271 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%4086 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3272 = torch.constant.int 1
%int7_3273 = torch.constant.int 7
%int1600_3274 = torch.constant.int 1600
%4087 = torch.prim.ListConstruct %int1_3272, %int7_3273, %int1600_3274 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4088 = torch.aten.reshape %4085, %4087 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_3275 = torch.constant.int 1
%4089 = torch.aten.add.Tensor %4058, %4088, %int1_3275 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_3276 = torch.constant.float 9.9999997473787516E-6
%int1600_3277 = torch.constant.int 1600
%4090 = torch.prim.ListConstruct %int1600_3277 : (!torch.int) -> !torch.list<int>
%result0_3278, %result1_3279, %result2_3280 = torch.aten.native_layer_norm %4089, %4090, %482, %483, %float9.999990e-06_3276 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%4091 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_3281 = torch.constant.int 7
%int1600_3282 = torch.constant.int 1600
%4092 = torch.prim.ListConstruct %int7_3281, %int1600_3282 : (!torch.int, !torch.int) -> !torch.list<int>
%4093 = torch.aten.reshape %result0_3278, %4092 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_3283 = torch.constant.int 0
%int1_3284 = torch.constant.int 1
%4094 = torch.aten.mm %4093, %484 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%4095 = torch.aten.add.Tensor %4094, %485, %int1_3284 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%4096 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3285 = torch.constant.int 1
%int7_3286 = torch.constant.int 7
%int4800_3287 = torch.constant.int 4800
%4097 = torch.prim.ListConstruct %int1_3285, %int7_3286, %int4800_3287 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4098 = torch.aten.reshape %4095, %4097 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%4099 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%4100 = torch.prim.tolist(%4099) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2_3288 = torch.constant.int 2
%4101 = torch.aten.split_with_sizes %4098, %4100, %int2_3288 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%4102:3 = torch.prim.ListUnpack %4101 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%4103 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_3289 = torch.constant.int 1
%int7_3290 = torch.constant.int 7
%int25_3291 = torch.constant.int 25
%int64_3292 = torch.constant.int 64
%4104 = torch.prim.ListConstruct %int1_3289, %int7_3290, %int25_3291, %int64_3292 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4105 = torch.aten.reshape %4102#0, %4104 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_3293 = torch.constant.int 1
%int2_3294 = torch.constant.int 2
%4106 = torch.aten.transpose.int %4105, %int1_3293, %int2_3294 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%4107 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_3295 = torch.constant.int 1
%int7_3296 = torch.constant.int 7
%int25_3297 = torch.constant.int 25
%int64_3298 = torch.constant.int 64
%4108 = torch.prim.ListConstruct %int1_3295, %int7_3296, %int25_3297, %int64_3298 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4109 = torch.aten.reshape %4102#1, %4108 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_3299 = torch.constant.int 1
%int2_3300 = torch.constant.int 2
%4110 = torch.aten.transpose.int %4109, %int1_3299, %int2_3300 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%4111 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_3301 = torch.constant.int 1
%int7_3302 = torch.constant.int 7
%int25_3303 = torch.constant.int 25
%int64_3304 = torch.constant.int 64
%4112 = torch.prim.ListConstruct %int1_3301, %int7_3302, %int25_3303, %int64_3304 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4113 = torch.aten.reshape %4102#2, %4112 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_3305 = torch.constant.int 1
%int2_3306 = torch.constant.int 2
%4114 = torch.aten.transpose.int %4113, %int1_3305, %int2_3306 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_3307 = torch.constant.int 1
%int2_3308 = torch.constant.int 2
%4115 = torch.aten.transpose.int %4109, %int1_3307, %int2_3308 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_3309 = torch.constant.int 2
%int3_3310 = torch.constant.int 3
%4116 = torch.aten.transpose.int %4115, %int2_3309, %int3_3310 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%4117 = torch.aten.matmul %4106, %4116 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%4118 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%4119 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%4120 = torch.aten.pow.Tensor_Tensor %4118, %4119 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%4121 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_3311 = torch.constant.int 0
%4122 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_3312 = torch.constant.none
%float0.000000e00_3313 = torch.constant.float 0.000000e+00
%4123 = torch.aten.full %4122, %float0.000000e00_3313, %none_3312, %none_3312, %none_3312, %none_3312 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_3314 = torch.constant.int 1
%4124 = torch.aten.add.Tensor %4123, %4120, %int1_3314 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%4125 = torch.aten.div.Tensor %4117, %4124 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%4126 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6_3315 = torch.constant.int 6
%none_3316 = torch.constant.none
%false_3317 = torch.constant.bool false
%4127 = torch.aten.to.dtype %4125, %int6_3315, %false_3317, %false_3317, %none_3316 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%4128 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%4129 = torch.aten.where.self %4126, %4127, %4128 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_3318 = torch.constant.int 3
%none_3319 = torch.constant.none
%4130 = torch.aten.softmax.int %4129, %int3_3318, %none_3319 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_3320 = torch.constant.int 6
%none_3321 = torch.constant.none
%false_3322 = torch.constant.bool false
%4131 = torch.aten.to.dtype %4130, %int6_3320, %false_3322, %false_3322, %none_3321 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%4132 = torch.aten.matmul %4131, %4114 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_3323 = torch.constant.int 1
%int2_3324 = torch.constant.int 2
%4133 = torch.aten.transpose.int %4132, %int1_3323, %int2_3324 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%4134 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3325 = torch.constant.int 1
%int7_3326 = torch.constant.int 7
%int1600_3327 = torch.constant.int 1600
%4135 = torch.prim.ListConstruct %int1_3325, %int7_3326, %int1600_3327 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4136 = torch.aten.reshape %4133, %4135 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%4137 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_3328 = torch.constant.int 7
%int1600_3329 = torch.constant.int 1600
%4138 = torch.prim.ListConstruct %int7_3328, %int1600_3329 : (!torch.int, !torch.int) -> !torch.list<int>
%4139 = torch.aten.reshape %4136, %4138 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_3330 = torch.constant.int 0
%int1_3331 = torch.constant.int 1
%4140 = torch.aten.mm %4139, %486 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%4141 = torch.aten.add.Tensor %4140, %487, %int1_3331 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%4142 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3332 = torch.constant.int 1
%int7_3333 = torch.constant.int 7
%int1600_3334 = torch.constant.int 1600
%4143 = torch.prim.ListConstruct %int1_3332, %int7_3333, %int1600_3334 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4144 = torch.aten.reshape %4141, %4143 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_3335 = torch.constant.int 1
%4145 = torch.aten.add.Tensor %4144, %4089, %int1_3335 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_3336 = torch.constant.float 9.9999997473787516E-6
%int1600_3337 = torch.constant.int 1600
%4146 = torch.prim.ListConstruct %int1600_3337 : (!torch.int) -> !torch.list<int>
%result0_3338, %result1_3339, %result2_3340 = torch.aten.native_layer_norm %4145, %4146, %488, %489, %float9.999990e-06_3336 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%4147 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_3341 = torch.constant.int 7
%int1600_3342 = torch.constant.int 1600
%4148 = torch.prim.ListConstruct %int7_3341, %int1600_3342 : (!torch.int, !torch.int) -> !torch.list<int>
%4149 = torch.aten.reshape %result0_3338, %4148 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_3343 = torch.constant.int 0
%int1_3344 = torch.constant.int 1
%4150 = torch.aten.mm %4149, %490 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%4151 = torch.aten.add.Tensor %4150, %491, %int1_3344 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%4152 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3345 = torch.constant.int 1
%int7_3346 = torch.constant.int 7
%int6400_3347 = torch.constant.int 6400
%4153 = torch.prim.ListConstruct %int1_3345, %int7_3346, %int6400_3347 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4154 = torch.aten.reshape %4151, %4153 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%4155 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%4156 = torch.aten.mul.Tensor %4154, %4155 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%4157 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%4158 = torch.aten.pow.Tensor_Tensor %4154, %4157 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%4159 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%4160 = torch.aten.mul.Tensor %4158, %4159 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_3348 = torch.constant.int 1
%4161 = torch.aten.add.Tensor %4154, %4160, %int1_3348 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%4162 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%4163 = torch.aten.mul.Tensor %4161, %4162 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%4164 = torch.aten.tanh %4163 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%4165 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_3349 = torch.constant.int 1
%4166 = torch.aten.add.Tensor %4164, %4165, %int1_3349 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%4167 = torch.aten.mul.Tensor %4156, %4166 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%4168 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_3350 = torch.constant.int 7
%int6400_3351 = torch.constant.int 6400
%4169 = torch.prim.ListConstruct %int7_3350, %int6400_3351 : (!torch.int, !torch.int) -> !torch.list<int>
%4170 = torch.aten.reshape %4167, %4169 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_3352 = torch.constant.int 0
%int1_3353 = torch.constant.int 1
%4171 = torch.aten.mm %4170, %492 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%4172 = torch.aten.add.Tensor %4171, %493, %int1_3353 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%4173 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3354 = torch.constant.int 1
%int7_3355 = torch.constant.int 7
%int1600_3356 = torch.constant.int 1600
%4174 = torch.prim.ListConstruct %int1_3354, %int7_3355, %int1600_3356 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4175 = torch.aten.reshape %4172, %4174 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_3357 = torch.constant.int 1
%4176 = torch.aten.add.Tensor %4145, %4175, %int1_3357 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_3358 = torch.constant.float 9.9999997473787516E-6
%int1600_3359 = torch.constant.int 1600
%4177 = torch.prim.ListConstruct %int1600_3359 : (!torch.int) -> !torch.list<int>
%result0_3360, %result1_3361, %result2_3362 = torch.aten.native_layer_norm %4176, %4177, %494, %495, %float9.999990e-06_3358 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%4178 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_3363 = torch.constant.int 7
%int1600_3364 = torch.constant.int 1600
%4179 = torch.prim.ListConstruct %int7_3363, %int1600_3364 : (!torch.int, !torch.int) -> !torch.list<int>
%4180 = torch.aten.reshape %result0_3360, %4179 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_3365 = torch.constant.int 0
%int1_3366 = torch.constant.int 1
%4181 = torch.aten.mm %4180, %496 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%4182 = torch.aten.add.Tensor %4181, %497, %int1_3366 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%4183 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3367 = torch.constant.int 1
%int7_3368 = torch.constant.int 7
%int4800_3369 = torch.constant.int 4800
%4184 = torch.prim.ListConstruct %int1_3367, %int7_3368, %int4800_3369 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4185 = torch.aten.reshape %4182, %4184 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%4186 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%4187 = torch.prim.tolist(%4186) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2_3370 = torch.constant.int 2
%4188 = torch.aten.split_with_sizes %4185, %4187, %int2_3370 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%4189:3 = torch.prim.ListUnpack %4188 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%4190 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_3371 = torch.constant.int 1
%int7_3372 = torch.constant.int 7
%int25_3373 = torch.constant.int 25
%int64_3374 = torch.constant.int 64
%4191 = torch.prim.ListConstruct %int1_3371, %int7_3372, %int25_3373, %int64_3374 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4192 = torch.aten.reshape %4189#0, %4191 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_3375 = torch.constant.int 1
%int2_3376 = torch.constant.int 2
%4193 = torch.aten.transpose.int %4192, %int1_3375, %int2_3376 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%4194 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_3377 = torch.constant.int 1
%int7_3378 = torch.constant.int 7
%int25_3379 = torch.constant.int 25
%int64_3380 = torch.constant.int 64
%4195 = torch.prim.ListConstruct %int1_3377, %int7_3378, %int25_3379, %int64_3380 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4196 = torch.aten.reshape %4189#1, %4195 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_3381 = torch.constant.int 1
%int2_3382 = torch.constant.int 2
%4197 = torch.aten.transpose.int %4196, %int1_3381, %int2_3382 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%4198 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_3383 = torch.constant.int 1
%int7_3384 = torch.constant.int 7
%int25_3385 = torch.constant.int 25
%int64_3386 = torch.constant.int 64
%4199 = torch.prim.ListConstruct %int1_3383, %int7_3384, %int25_3385, %int64_3386 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4200 = torch.aten.reshape %4189#2, %4199 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_3387 = torch.constant.int 1
%int2_3388 = torch.constant.int 2
%4201 = torch.aten.transpose.int %4200, %int1_3387, %int2_3388 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_3389 = torch.constant.int 1
%int2_3390 = torch.constant.int 2
%4202 = torch.aten.transpose.int %4196, %int1_3389, %int2_3390 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_3391 = torch.constant.int 2
%int3_3392 = torch.constant.int 3
%4203 = torch.aten.transpose.int %4202, %int2_3391, %int3_3392 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%4204 = torch.aten.matmul %4193, %4203 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%4205 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%4206 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%4207 = torch.aten.pow.Tensor_Tensor %4205, %4206 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%4208 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_3393 = torch.constant.int 0
%4209 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_3394 = torch.constant.none
%float0.000000e00_3395 = torch.constant.float 0.000000e+00
%4210 = torch.aten.full %4209, %float0.000000e00_3395, %none_3394, %none_3394, %none_3394, %none_3394 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_3396 = torch.constant.int 1
%4211 = torch.aten.add.Tensor %4210, %4207, %int1_3396 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%4212 = torch.aten.div.Tensor %4204, %4211 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%4213 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6_3397 = torch.constant.int 6
%none_3398 = torch.constant.none
%false_3399 = torch.constant.bool false
%4214 = torch.aten.to.dtype %4212, %int6_3397, %false_3399, %false_3399, %none_3398 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%4215 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%4216 = torch.aten.where.self %4213, %4214, %4215 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_3400 = torch.constant.int 3
%none_3401 = torch.constant.none
%4217 = torch.aten.softmax.int %4216, %int3_3400, %none_3401 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_3402 = torch.constant.int 6
%none_3403 = torch.constant.none
%false_3404 = torch.constant.bool false
%4218 = torch.aten.to.dtype %4217, %int6_3402, %false_3404, %false_3404, %none_3403 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%4219 = torch.aten.matmul %4218, %4201 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_3405 = torch.constant.int 1
%int2_3406 = torch.constant.int 2
%4220 = torch.aten.transpose.int %4219, %int1_3405, %int2_3406 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%4221 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3407 = torch.constant.int 1
%int7_3408 = torch.constant.int 7
%int1600_3409 = torch.constant.int 1600
%4222 = torch.prim.ListConstruct %int1_3407, %int7_3408, %int1600_3409 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4223 = torch.aten.reshape %4220, %4222 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%4224 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_3410 = torch.constant.int 7
%int1600_3411 = torch.constant.int 1600
%4225 = torch.prim.ListConstruct %int7_3410, %int1600_3411 : (!torch.int, !torch.int) -> !torch.list<int>
%4226 = torch.aten.reshape %4223, %4225 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_3412 = torch.constant.int 0
%int1_3413 = torch.constant.int 1
%4227 = torch.aten.mm %4226, %498 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%4228 = torch.aten.add.Tensor %4227, %499, %int1_3413 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%4229 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3414 = torch.constant.int 1
%int7_3415 = torch.constant.int 7
%int1600_3416 = torch.constant.int 1600
%4230 = torch.prim.ListConstruct %int1_3414, %int7_3415, %int1600_3416 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4231 = torch.aten.reshape %4228, %4230 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_3417 = torch.constant.int 1
%4232 = torch.aten.add.Tensor %4231, %4176, %int1_3417 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_3418 = torch.constant.float 9.9999997473787516E-6
%int1600_3419 = torch.constant.int 1600
%4233 = torch.prim.ListConstruct %int1600_3419 : (!torch.int) -> !torch.list<int>
%result0_3420, %result1_3421, %result2_3422 = torch.aten.native_layer_norm %4232, %4233, %500, %501, %float9.999990e-06_3418 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%4234 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_3423 = torch.constant.int 7
%int1600_3424 = torch.constant.int 1600
%4235 = torch.prim.ListConstruct %int7_3423, %int1600_3424 : (!torch.int, !torch.int) -> !torch.list<int>
%4236 = torch.aten.reshape %result0_3420, %4235 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_3425 = torch.constant.int 0
%int1_3426 = torch.constant.int 1
%4237 = torch.aten.mm %4236, %502 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%4238 = torch.aten.add.Tensor %4237, %503, %int1_3426 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%4239 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3427 = torch.constant.int 1
%int7_3428 = torch.constant.int 7
%int6400_3429 = torch.constant.int 6400
%4240 = torch.prim.ListConstruct %int1_3427, %int7_3428, %int6400_3429 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4241 = torch.aten.reshape %4238, %4240 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%4242 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%4243 = torch.aten.mul.Tensor %4241, %4242 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%4244 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%4245 = torch.aten.pow.Tensor_Tensor %4241, %4244 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%4246 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%4247 = torch.aten.mul.Tensor %4245, %4246 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_3430 = torch.constant.int 1
%4248 = torch.aten.add.Tensor %4241, %4247, %int1_3430 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%4249 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%4250 = torch.aten.mul.Tensor %4248, %4249 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%4251 = torch.aten.tanh %4250 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%4252 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_3431 = torch.constant.int 1
%4253 = torch.aten.add.Tensor %4251, %4252, %int1_3431 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%4254 = torch.aten.mul.Tensor %4243, %4253 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%4255 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_3432 = torch.constant.int 7
%int6400_3433 = torch.constant.int 6400
%4256 = torch.prim.ListConstruct %int7_3432, %int6400_3433 : (!torch.int, !torch.int) -> !torch.list<int>
%4257 = torch.aten.reshape %4254, %4256 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_3434 = torch.constant.int 0
%int1_3435 = torch.constant.int 1
%4258 = torch.aten.mm %4257, %504 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%4259 = torch.aten.add.Tensor %4258, %505, %int1_3435 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%4260 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3436 = torch.constant.int 1
%int7_3437 = torch.constant.int 7
%int1600_3438 = torch.constant.int 1600
%4261 = torch.prim.ListConstruct %int1_3436, %int7_3437, %int1600_3438 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4262 = torch.aten.reshape %4259, %4261 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_3439 = torch.constant.int 1
%4263 = torch.aten.add.Tensor %4232, %4262, %int1_3439 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_3440 = torch.constant.float 9.9999997473787516E-6
%int1600_3441 = torch.constant.int 1600
%4264 = torch.prim.ListConstruct %int1600_3441 : (!torch.int) -> !torch.list<int>
%result0_3442, %result1_3443, %result2_3444 = torch.aten.native_layer_norm %4263, %4264, %506, %507, %float9.999990e-06_3440 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%4265 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_3445 = torch.constant.int 7
%int1600_3446 = torch.constant.int 1600
%4266 = torch.prim.ListConstruct %int7_3445, %int1600_3446 : (!torch.int, !torch.int) -> !torch.list<int>
%4267 = torch.aten.reshape %result0_3442, %4266 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_3447 = torch.constant.int 0
%int1_3448 = torch.constant.int 1
%4268 = torch.aten.mm %4267, %508 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%4269 = torch.aten.add.Tensor %4268, %509, %int1_3448 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%4270 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3449 = torch.constant.int 1
%int7_3450 = torch.constant.int 7
%int4800_3451 = torch.constant.int 4800
%4271 = torch.prim.ListConstruct %int1_3449, %int7_3450, %int4800_3451 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4272 = torch.aten.reshape %4269, %4271 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%4273 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%4274 = torch.prim.tolist(%4273) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2_3452 = torch.constant.int 2
%4275 = torch.aten.split_with_sizes %4272, %4274, %int2_3452 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%4276:3 = torch.prim.ListUnpack %4275 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%4277 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_3453 = torch.constant.int 1
%int7_3454 = torch.constant.int 7
%int25_3455 = torch.constant.int 25
%int64_3456 = torch.constant.int 64
%4278 = torch.prim.ListConstruct %int1_3453, %int7_3454, %int25_3455, %int64_3456 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4279 = torch.aten.reshape %4276#0, %4278 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_3457 = torch.constant.int 1
%int2_3458 = torch.constant.int 2
%4280 = torch.aten.transpose.int %4279, %int1_3457, %int2_3458 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%4281 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_3459 = torch.constant.int 1
%int7_3460 = torch.constant.int 7
%int25_3461 = torch.constant.int 25
%int64_3462 = torch.constant.int 64
%4282 = torch.prim.ListConstruct %int1_3459, %int7_3460, %int25_3461, %int64_3462 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4283 = torch.aten.reshape %4276#1, %4282 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_3463 = torch.constant.int 1
%int2_3464 = torch.constant.int 2
%4284 = torch.aten.transpose.int %4283, %int1_3463, %int2_3464 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%4285 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_3465 = torch.constant.int 1
%int7_3466 = torch.constant.int 7
%int25_3467 = torch.constant.int 25
%int64_3468 = torch.constant.int 64
%4286 = torch.prim.ListConstruct %int1_3465, %int7_3466, %int25_3467, %int64_3468 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4287 = torch.aten.reshape %4276#2, %4286 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_3469 = torch.constant.int 1
%int2_3470 = torch.constant.int 2
%4288 = torch.aten.transpose.int %4287, %int1_3469, %int2_3470 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_3471 = torch.constant.int 1
%int2_3472 = torch.constant.int 2
%4289 = torch.aten.transpose.int %4283, %int1_3471, %int2_3472 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_3473 = torch.constant.int 2
%int3_3474 = torch.constant.int 3
%4290 = torch.aten.transpose.int %4289, %int2_3473, %int3_3474 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%4291 = torch.aten.matmul %4280, %4290 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%4292 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%4293 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%4294 = torch.aten.pow.Tensor_Tensor %4292, %4293 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%4295 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_3475 = torch.constant.int 0
%4296 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_3476 = torch.constant.none
%float0.000000e00_3477 = torch.constant.float 0.000000e+00
%4297 = torch.aten.full %4296, %float0.000000e00_3477, %none_3476, %none_3476, %none_3476, %none_3476 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_3478 = torch.constant.int 1
%4298 = torch.aten.add.Tensor %4297, %4294, %int1_3478 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%4299 = torch.aten.div.Tensor %4291, %4298 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%4300 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6_3479 = torch.constant.int 6
%none_3480 = torch.constant.none
%false_3481 = torch.constant.bool false
%4301 = torch.aten.to.dtype %4299, %int6_3479, %false_3481, %false_3481, %none_3480 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%4302 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%4303 = torch.aten.where.self %4300, %4301, %4302 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_3482 = torch.constant.int 3
%none_3483 = torch.constant.none
%4304 = torch.aten.softmax.int %4303, %int3_3482, %none_3483 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_3484 = torch.constant.int 6
%none_3485 = torch.constant.none
%false_3486 = torch.constant.bool false
%4305 = torch.aten.to.dtype %4304, %int6_3484, %false_3486, %false_3486, %none_3485 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%4306 = torch.aten.matmul %4305, %4288 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_3487 = torch.constant.int 1
%int2_3488 = torch.constant.int 2
%4307 = torch.aten.transpose.int %4306, %int1_3487, %int2_3488 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%4308 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3489 = torch.constant.int 1
%int7_3490 = torch.constant.int 7
%int1600_3491 = torch.constant.int 1600
%4309 = torch.prim.ListConstruct %int1_3489, %int7_3490, %int1600_3491 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4310 = torch.aten.reshape %4307, %4309 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%4311 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_3492 = torch.constant.int 7
%int1600_3493 = torch.constant.int 1600
%4312 = torch.prim.ListConstruct %int7_3492, %int1600_3493 : (!torch.int, !torch.int) -> !torch.list<int>
%4313 = torch.aten.reshape %4310, %4312 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_3494 = torch.constant.int 0
%int1_3495 = torch.constant.int 1
%4314 = torch.aten.mm %4313, %510 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%4315 = torch.aten.add.Tensor %4314, %511, %int1_3495 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%4316 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3496 = torch.constant.int 1
%int7_3497 = torch.constant.int 7
%int1600_3498 = torch.constant.int 1600
%4317 = torch.prim.ListConstruct %int1_3496, %int7_3497, %int1600_3498 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4318 = torch.aten.reshape %4315, %4317 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_3499 = torch.constant.int 1
%4319 = torch.aten.add.Tensor %4318, %4263, %int1_3499 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_3500 = torch.constant.float 9.9999997473787516E-6
%int1600_3501 = torch.constant.int 1600
%4320 = torch.prim.ListConstruct %int1600_3501 : (!torch.int) -> !torch.list<int>
%result0_3502, %result1_3503, %result2_3504 = torch.aten.native_layer_norm %4319, %4320, %512, %513, %float9.999990e-06_3500 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%4321 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_3505 = torch.constant.int 7
%int1600_3506 = torch.constant.int 1600
%4322 = torch.prim.ListConstruct %int7_3505, %int1600_3506 : (!torch.int, !torch.int) -> !torch.list<int>
%4323 = torch.aten.reshape %result0_3502, %4322 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_3507 = torch.constant.int 0
%int1_3508 = torch.constant.int 1
%4324 = torch.aten.mm %4323, %514 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%4325 = torch.aten.add.Tensor %4324, %515, %int1_3508 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%4326 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3509 = torch.constant.int 1
%int7_3510 = torch.constant.int 7
%int6400_3511 = torch.constant.int 6400
%4327 = torch.prim.ListConstruct %int1_3509, %int7_3510, %int6400_3511 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4328 = torch.aten.reshape %4325, %4327 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%4329 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%4330 = torch.aten.mul.Tensor %4328, %4329 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%4331 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%4332 = torch.aten.pow.Tensor_Tensor %4328, %4331 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%4333 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%4334 = torch.aten.mul.Tensor %4332, %4333 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_3512 = torch.constant.int 1
%4335 = torch.aten.add.Tensor %4328, %4334, %int1_3512 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%4336 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%4337 = torch.aten.mul.Tensor %4335, %4336 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%4338 = torch.aten.tanh %4337 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%4339 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_3513 = torch.constant.int 1
%4340 = torch.aten.add.Tensor %4338, %4339, %int1_3513 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%4341 = torch.aten.mul.Tensor %4330, %4340 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%4342 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_3514 = torch.constant.int 7
%int6400_3515 = torch.constant.int 6400
%4343 = torch.prim.ListConstruct %int7_3514, %int6400_3515 : (!torch.int, !torch.int) -> !torch.list<int>
%4344 = torch.aten.reshape %4341, %4343 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_3516 = torch.constant.int 0
%int1_3517 = torch.constant.int 1
%4345 = torch.aten.mm %4344, %516 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%4346 = torch.aten.add.Tensor %4345, %517, %int1_3517 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%4347 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3518 = torch.constant.int 1
%int7_3519 = torch.constant.int 7
%int1600_3520 = torch.constant.int 1600
%4348 = torch.prim.ListConstruct %int1_3518, %int7_3519, %int1600_3520 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4349 = torch.aten.reshape %4346, %4348 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_3521 = torch.constant.int 1
%4350 = torch.aten.add.Tensor %4319, %4349, %int1_3521 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_3522 = torch.constant.float 9.9999997473787516E-6
%int1600_3523 = torch.constant.int 1600
%4351 = torch.prim.ListConstruct %int1600_3523 : (!torch.int) -> !torch.list<int>
%result0_3524, %result1_3525, %result2_3526 = torch.aten.native_layer_norm %4350, %4351, %518, %519, %float9.999990e-06_3522 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%4352 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_3527 = torch.constant.int 7
%int1600_3528 = torch.constant.int 1600
%4353 = torch.prim.ListConstruct %int7_3527, %int1600_3528 : (!torch.int, !torch.int) -> !torch.list<int>
%4354 = torch.aten.reshape %result0_3524, %4353 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_3529 = torch.constant.int 0
%int1_3530 = torch.constant.int 1
%4355 = torch.aten.mm %4354, %520 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%4356 = torch.aten.add.Tensor %4355, %521, %int1_3530 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%4357 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3531 = torch.constant.int 1
%int7_3532 = torch.constant.int 7
%int4800_3533 = torch.constant.int 4800
%4358 = torch.prim.ListConstruct %int1_3531, %int7_3532, %int4800_3533 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4359 = torch.aten.reshape %4356, %4358 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%4360 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%4361 = torch.prim.tolist(%4360) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2_3534 = torch.constant.int 2
%4362 = torch.aten.split_with_sizes %4359, %4361, %int2_3534 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%4363:3 = torch.prim.ListUnpack %4362 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%4364 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_3535 = torch.constant.int 1
%int7_3536 = torch.constant.int 7
%int25_3537 = torch.constant.int 25
%int64_3538 = torch.constant.int 64
%4365 = torch.prim.ListConstruct %int1_3535, %int7_3536, %int25_3537, %int64_3538 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4366 = torch.aten.reshape %4363#0, %4365 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_3539 = torch.constant.int 1
%int2_3540 = torch.constant.int 2
%4367 = torch.aten.transpose.int %4366, %int1_3539, %int2_3540 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%4368 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_3541 = torch.constant.int 1
%int7_3542 = torch.constant.int 7
%int25_3543 = torch.constant.int 25
%int64_3544 = torch.constant.int 64
%4369 = torch.prim.ListConstruct %int1_3541, %int7_3542, %int25_3543, %int64_3544 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4370 = torch.aten.reshape %4363#1, %4369 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_3545 = torch.constant.int 1
%int2_3546 = torch.constant.int 2
%4371 = torch.aten.transpose.int %4370, %int1_3545, %int2_3546 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%4372 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_3547 = torch.constant.int 1
%int7_3548 = torch.constant.int 7
%int25_3549 = torch.constant.int 25
%int64_3550 = torch.constant.int 64
%4373 = torch.prim.ListConstruct %int1_3547, %int7_3548, %int25_3549, %int64_3550 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4374 = torch.aten.reshape %4363#2, %4373 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_3551 = torch.constant.int 1
%int2_3552 = torch.constant.int 2
%4375 = torch.aten.transpose.int %4374, %int1_3551, %int2_3552 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_3553 = torch.constant.int 1
%int2_3554 = torch.constant.int 2
%4376 = torch.aten.transpose.int %4370, %int1_3553, %int2_3554 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_3555 = torch.constant.int 2
%int3_3556 = torch.constant.int 3
%4377 = torch.aten.transpose.int %4376, %int2_3555, %int3_3556 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%4378 = torch.aten.matmul %4367, %4377 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%4379 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%4380 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%4381 = torch.aten.pow.Tensor_Tensor %4379, %4380 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%4382 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_3557 = torch.constant.int 0
%4383 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_3558 = torch.constant.none
%float0.000000e00_3559 = torch.constant.float 0.000000e+00
%4384 = torch.aten.full %4383, %float0.000000e00_3559, %none_3558, %none_3558, %none_3558, %none_3558 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_3560 = torch.constant.int 1
%4385 = torch.aten.add.Tensor %4384, %4381, %int1_3560 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%4386 = torch.aten.div.Tensor %4378, %4385 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%4387 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6_3561 = torch.constant.int 6
%none_3562 = torch.constant.none
%false_3563 = torch.constant.bool false
%4388 = torch.aten.to.dtype %4386, %int6_3561, %false_3563, %false_3563, %none_3562 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%4389 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%4390 = torch.aten.where.self %4387, %4388, %4389 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_3564 = torch.constant.int 3
%none_3565 = torch.constant.none
%4391 = torch.aten.softmax.int %4390, %int3_3564, %none_3565 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_3566 = torch.constant.int 6
%none_3567 = torch.constant.none
%false_3568 = torch.constant.bool false
%4392 = torch.aten.to.dtype %4391, %int6_3566, %false_3568, %false_3568, %none_3567 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%4393 = torch.aten.matmul %4392, %4375 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_3569 = torch.constant.int 1
%int2_3570 = torch.constant.int 2
%4394 = torch.aten.transpose.int %4393, %int1_3569, %int2_3570 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%4395 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3571 = torch.constant.int 1
%int7_3572 = torch.constant.int 7
%int1600_3573 = torch.constant.int 1600
%4396 = torch.prim.ListConstruct %int1_3571, %int7_3572, %int1600_3573 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4397 = torch.aten.reshape %4394, %4396 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%4398 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_3574 = torch.constant.int 7
%int1600_3575 = torch.constant.int 1600
%4399 = torch.prim.ListConstruct %int7_3574, %int1600_3575 : (!torch.int, !torch.int) -> !torch.list<int>
%4400 = torch.aten.reshape %4397, %4399 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_3576 = torch.constant.int 0
%int1_3577 = torch.constant.int 1
%4401 = torch.aten.mm %4400, %522 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%4402 = torch.aten.add.Tensor %4401, %523, %int1_3577 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%4403 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3578 = torch.constant.int 1
%int7_3579 = torch.constant.int 7
%int1600_3580 = torch.constant.int 1600
%4404 = torch.prim.ListConstruct %int1_3578, %int7_3579, %int1600_3580 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4405 = torch.aten.reshape %4402, %4404 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_3581 = torch.constant.int 1
%4406 = torch.aten.add.Tensor %4405, %4350, %int1_3581 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_3582 = torch.constant.float 9.9999997473787516E-6
%int1600_3583 = torch.constant.int 1600
%4407 = torch.prim.ListConstruct %int1600_3583 : (!torch.int) -> !torch.list<int>
%result0_3584, %result1_3585, %result2_3586 = torch.aten.native_layer_norm %4406, %4407, %524, %525, %float9.999990e-06_3582 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%4408 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_3587 = torch.constant.int 7
%int1600_3588 = torch.constant.int 1600
%4409 = torch.prim.ListConstruct %int7_3587, %int1600_3588 : (!torch.int, !torch.int) -> !torch.list<int>
%4410 = torch.aten.reshape %result0_3584, %4409 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_3589 = torch.constant.int 0
%int1_3590 = torch.constant.int 1
%4411 = torch.aten.mm %4410, %526 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%4412 = torch.aten.add.Tensor %4411, %527, %int1_3590 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%4413 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3591 = torch.constant.int 1
%int7_3592 = torch.constant.int 7
%int6400_3593 = torch.constant.int 6400
%4414 = torch.prim.ListConstruct %int1_3591, %int7_3592, %int6400_3593 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4415 = torch.aten.reshape %4412, %4414 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%4416 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%4417 = torch.aten.mul.Tensor %4415, %4416 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%4418 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%4419 = torch.aten.pow.Tensor_Tensor %4415, %4418 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%4420 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%4421 = torch.aten.mul.Tensor %4419, %4420 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_3594 = torch.constant.int 1
%4422 = torch.aten.add.Tensor %4415, %4421, %int1_3594 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%4423 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%4424 = torch.aten.mul.Tensor %4422, %4423 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%4425 = torch.aten.tanh %4424 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%4426 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_3595 = torch.constant.int 1
%4427 = torch.aten.add.Tensor %4425, %4426, %int1_3595 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%4428 = torch.aten.mul.Tensor %4417, %4427 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%4429 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_3596 = torch.constant.int 7
%int6400_3597 = torch.constant.int 6400
%4430 = torch.prim.ListConstruct %int7_3596, %int6400_3597 : (!torch.int, !torch.int) -> !torch.list<int>
%4431 = torch.aten.reshape %4428, %4430 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_3598 = torch.constant.int 0
%int1_3599 = torch.constant.int 1
%4432 = torch.aten.mm %4431, %528 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%4433 = torch.aten.add.Tensor %4432, %529, %int1_3599 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%4434 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3600 = torch.constant.int 1
%int7_3601 = torch.constant.int 7
%int1600_3602 = torch.constant.int 1600
%4435 = torch.prim.ListConstruct %int1_3600, %int7_3601, %int1600_3602 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4436 = torch.aten.reshape %4433, %4435 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_3603 = torch.constant.int 1
%4437 = torch.aten.add.Tensor %4406, %4436, %int1_3603 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_3604 = torch.constant.float 9.9999997473787516E-6
%int1600_3605 = torch.constant.int 1600
%4438 = torch.prim.ListConstruct %int1600_3605 : (!torch.int) -> !torch.list<int>
%result0_3606, %result1_3607, %result2_3608 = torch.aten.native_layer_norm %4437, %4438, %530, %531, %float9.999990e-06_3604 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%4439 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_3609 = torch.constant.int 7
%int1600_3610 = torch.constant.int 1600
%4440 = torch.prim.ListConstruct %int7_3609, %int1600_3610 : (!torch.int, !torch.int) -> !torch.list<int>
%4441 = torch.aten.reshape %result0_3606, %4440 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_3611 = torch.constant.int 0
%int1_3612 = torch.constant.int 1
%4442 = torch.aten.mm %4441, %532 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%4443 = torch.aten.add.Tensor %4442, %533, %int1_3612 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%4444 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3613 = torch.constant.int 1
%int7_3614 = torch.constant.int 7
%int4800_3615 = torch.constant.int 4800
%4445 = torch.prim.ListConstruct %int1_3613, %int7_3614, %int4800_3615 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4446 = torch.aten.reshape %4443, %4445 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%4447 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%4448 = torch.prim.tolist(%4447) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2_3616 = torch.constant.int 2
%4449 = torch.aten.split_with_sizes %4446, %4448, %int2_3616 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%4450:3 = torch.prim.ListUnpack %4449 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%4451 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_3617 = torch.constant.int 1
%int7_3618 = torch.constant.int 7
%int25_3619 = torch.constant.int 25
%int64_3620 = torch.constant.int 64
%4452 = torch.prim.ListConstruct %int1_3617, %int7_3618, %int25_3619, %int64_3620 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4453 = torch.aten.reshape %4450#0, %4452 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_3621 = torch.constant.int 1
%int2_3622 = torch.constant.int 2
%4454 = torch.aten.transpose.int %4453, %int1_3621, %int2_3622 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%4455 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_3623 = torch.constant.int 1
%int7_3624 = torch.constant.int 7
%int25_3625 = torch.constant.int 25
%int64_3626 = torch.constant.int 64
%4456 = torch.prim.ListConstruct %int1_3623, %int7_3624, %int25_3625, %int64_3626 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4457 = torch.aten.reshape %4450#1, %4456 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_3627 = torch.constant.int 1
%int2_3628 = torch.constant.int 2
%4458 = torch.aten.transpose.int %4457, %int1_3627, %int2_3628 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%4459 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_3629 = torch.constant.int 1
%int7_3630 = torch.constant.int 7
%int25_3631 = torch.constant.int 25
%int64_3632 = torch.constant.int 64
%4460 = torch.prim.ListConstruct %int1_3629, %int7_3630, %int25_3631, %int64_3632 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4461 = torch.aten.reshape %4450#2, %4460 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_3633 = torch.constant.int 1
%int2_3634 = torch.constant.int 2
%4462 = torch.aten.transpose.int %4461, %int1_3633, %int2_3634 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_3635 = torch.constant.int 1
%int2_3636 = torch.constant.int 2
%4463 = torch.aten.transpose.int %4457, %int1_3635, %int2_3636 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_3637 = torch.constant.int 2
%int3_3638 = torch.constant.int 3
%4464 = torch.aten.transpose.int %4463, %int2_3637, %int3_3638 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%4465 = torch.aten.matmul %4454, %4464 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%4466 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%4467 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%4468 = torch.aten.pow.Tensor_Tensor %4466, %4467 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%4469 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_3639 = torch.constant.int 0
%4470 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_3640 = torch.constant.none
%float0.000000e00_3641 = torch.constant.float 0.000000e+00
%4471 = torch.aten.full %4470, %float0.000000e00_3641, %none_3640, %none_3640, %none_3640, %none_3640 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_3642 = torch.constant.int 1
%4472 = torch.aten.add.Tensor %4471, %4468, %int1_3642 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%4473 = torch.aten.div.Tensor %4465, %4472 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%4474 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6_3643 = torch.constant.int 6
%none_3644 = torch.constant.none
%false_3645 = torch.constant.bool false
%4475 = torch.aten.to.dtype %4473, %int6_3643, %false_3645, %false_3645, %none_3644 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%4476 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%4477 = torch.aten.where.self %4474, %4475, %4476 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_3646 = torch.constant.int 3
%none_3647 = torch.constant.none
%4478 = torch.aten.softmax.int %4477, %int3_3646, %none_3647 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_3648 = torch.constant.int 6
%none_3649 = torch.constant.none
%false_3650 = torch.constant.bool false
%4479 = torch.aten.to.dtype %4478, %int6_3648, %false_3650, %false_3650, %none_3649 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%4480 = torch.aten.matmul %4479, %4462 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_3651 = torch.constant.int 1
%int2_3652 = torch.constant.int 2
%4481 = torch.aten.transpose.int %4480, %int1_3651, %int2_3652 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%4482 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3653 = torch.constant.int 1
%int7_3654 = torch.constant.int 7
%int1600_3655 = torch.constant.int 1600
%4483 = torch.prim.ListConstruct %int1_3653, %int7_3654, %int1600_3655 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4484 = torch.aten.reshape %4481, %4483 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%4485 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_3656 = torch.constant.int 7
%int1600_3657 = torch.constant.int 1600
%4486 = torch.prim.ListConstruct %int7_3656, %int1600_3657 : (!torch.int, !torch.int) -> !torch.list<int>
%4487 = torch.aten.reshape %4484, %4486 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_3658 = torch.constant.int 0
%int1_3659 = torch.constant.int 1
%4488 = torch.aten.mm %4487, %534 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%4489 = torch.aten.add.Tensor %4488, %535, %int1_3659 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%4490 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3660 = torch.constant.int 1
%int7_3661 = torch.constant.int 7
%int1600_3662 = torch.constant.int 1600
%4491 = torch.prim.ListConstruct %int1_3660, %int7_3661, %int1600_3662 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4492 = torch.aten.reshape %4489, %4491 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_3663 = torch.constant.int 1
%4493 = torch.aten.add.Tensor %4492, %4437, %int1_3663 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_3664 = torch.constant.float 9.9999997473787516E-6
%int1600_3665 = torch.constant.int 1600
%4494 = torch.prim.ListConstruct %int1600_3665 : (!torch.int) -> !torch.list<int>
%result0_3666, %result1_3667, %result2_3668 = torch.aten.native_layer_norm %4493, %4494, %536, %537, %float9.999990e-06_3664 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%4495 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_3669 = torch.constant.int 7
%int1600_3670 = torch.constant.int 1600
%4496 = torch.prim.ListConstruct %int7_3669, %int1600_3670 : (!torch.int, !torch.int) -> !torch.list<int>
%4497 = torch.aten.reshape %result0_3666, %4496 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_3671 = torch.constant.int 0
%int1_3672 = torch.constant.int 1
%4498 = torch.aten.mm %4497, %538 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%4499 = torch.aten.add.Tensor %4498, %539, %int1_3672 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%4500 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3673 = torch.constant.int 1
%int7_3674 = torch.constant.int 7
%int6400_3675 = torch.constant.int 6400
%4501 = torch.prim.ListConstruct %int1_3673, %int7_3674, %int6400_3675 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4502 = torch.aten.reshape %4499, %4501 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%4503 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%4504 = torch.aten.mul.Tensor %4502, %4503 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%4505 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%4506 = torch.aten.pow.Tensor_Tensor %4502, %4505 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%4507 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%4508 = torch.aten.mul.Tensor %4506, %4507 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_3676 = torch.constant.int 1
%4509 = torch.aten.add.Tensor %4502, %4508, %int1_3676 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%4510 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%4511 = torch.aten.mul.Tensor %4509, %4510 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%4512 = torch.aten.tanh %4511 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%4513 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_3677 = torch.constant.int 1
%4514 = torch.aten.add.Tensor %4512, %4513, %int1_3677 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%4515 = torch.aten.mul.Tensor %4504, %4514 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%4516 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_3678 = torch.constant.int 7
%int6400_3679 = torch.constant.int 6400
%4517 = torch.prim.ListConstruct %int7_3678, %int6400_3679 : (!torch.int, !torch.int) -> !torch.list<int>
%4518 = torch.aten.reshape %4515, %4517 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_3680 = torch.constant.int 0
%int1_3681 = torch.constant.int 1
%4519 = torch.aten.mm %4518, %540 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%4520 = torch.aten.add.Tensor %4519, %541, %int1_3681 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%4521 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3682 = torch.constant.int 1
%int7_3683 = torch.constant.int 7
%int1600_3684 = torch.constant.int 1600
%4522 = torch.prim.ListConstruct %int1_3682, %int7_3683, %int1600_3684 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4523 = torch.aten.reshape %4520, %4522 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_3685 = torch.constant.int 1
%4524 = torch.aten.add.Tensor %4493, %4523, %int1_3685 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_3686 = torch.constant.float 9.9999997473787516E-6
%int1600_3687 = torch.constant.int 1600
%4525 = torch.prim.ListConstruct %int1600_3687 : (!torch.int) -> !torch.list<int>
%result0_3688, %result1_3689, %result2_3690 = torch.aten.native_layer_norm %4524, %4525, %542, %543, %float9.999990e-06_3686 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%4526 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_3691 = torch.constant.int 7
%int1600_3692 = torch.constant.int 1600
%4527 = torch.prim.ListConstruct %int7_3691, %int1600_3692 : (!torch.int, !torch.int) -> !torch.list<int>
%4528 = torch.aten.reshape %result0_3688, %4527 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_3693 = torch.constant.int 0
%int1_3694 = torch.constant.int 1
%4529 = torch.aten.mm %4528, %544 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%4530 = torch.aten.add.Tensor %4529, %545, %int1_3694 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%4531 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3695 = torch.constant.int 1
%int7_3696 = torch.constant.int 7
%int4800_3697 = torch.constant.int 4800
%4532 = torch.prim.ListConstruct %int1_3695, %int7_3696, %int4800_3697 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4533 = torch.aten.reshape %4530, %4532 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%4534 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%4535 = torch.prim.tolist(%4534) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2_3698 = torch.constant.int 2
%4536 = torch.aten.split_with_sizes %4533, %4535, %int2_3698 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%4537:3 = torch.prim.ListUnpack %4536 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%4538 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_3699 = torch.constant.int 1
%int7_3700 = torch.constant.int 7
%int25_3701 = torch.constant.int 25
%int64_3702 = torch.constant.int 64
%4539 = torch.prim.ListConstruct %int1_3699, %int7_3700, %int25_3701, %int64_3702 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4540 = torch.aten.reshape %4537#0, %4539 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_3703 = torch.constant.int 1
%int2_3704 = torch.constant.int 2
%4541 = torch.aten.transpose.int %4540, %int1_3703, %int2_3704 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%4542 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_3705 = torch.constant.int 1
%int7_3706 = torch.constant.int 7
%int25_3707 = torch.constant.int 25
%int64_3708 = torch.constant.int 64
%4543 = torch.prim.ListConstruct %int1_3705, %int7_3706, %int25_3707, %int64_3708 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4544 = torch.aten.reshape %4537#1, %4543 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_3709 = torch.constant.int 1
%int2_3710 = torch.constant.int 2
%4545 = torch.aten.transpose.int %4544, %int1_3709, %int2_3710 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%4546 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_3711 = torch.constant.int 1
%int7_3712 = torch.constant.int 7
%int25_3713 = torch.constant.int 25
%int64_3714 = torch.constant.int 64
%4547 = torch.prim.ListConstruct %int1_3711, %int7_3712, %int25_3713, %int64_3714 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4548 = torch.aten.reshape %4537#2, %4547 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_3715 = torch.constant.int 1
%int2_3716 = torch.constant.int 2
%4549 = torch.aten.transpose.int %4548, %int1_3715, %int2_3716 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_3717 = torch.constant.int 1
%int2_3718 = torch.constant.int 2
%4550 = torch.aten.transpose.int %4544, %int1_3717, %int2_3718 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_3719 = torch.constant.int 2
%int3_3720 = torch.constant.int 3
%4551 = torch.aten.transpose.int %4550, %int2_3719, %int3_3720 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%4552 = torch.aten.matmul %4541, %4551 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%4553 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%4554 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%4555 = torch.aten.pow.Tensor_Tensor %4553, %4554 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%4556 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_3721 = torch.constant.int 0
%4557 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_3722 = torch.constant.none
%float0.000000e00_3723 = torch.constant.float 0.000000e+00
%4558 = torch.aten.full %4557, %float0.000000e00_3723, %none_3722, %none_3722, %none_3722, %none_3722 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_3724 = torch.constant.int 1
%4559 = torch.aten.add.Tensor %4558, %4555, %int1_3724 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%4560 = torch.aten.div.Tensor %4552, %4559 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%4561 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6_3725 = torch.constant.int 6
%none_3726 = torch.constant.none
%false_3727 = torch.constant.bool false
%4562 = torch.aten.to.dtype %4560, %int6_3725, %false_3727, %false_3727, %none_3726 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%4563 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%4564 = torch.aten.where.self %4561, %4562, %4563 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_3728 = torch.constant.int 3
%none_3729 = torch.constant.none
%4565 = torch.aten.softmax.int %4564, %int3_3728, %none_3729 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_3730 = torch.constant.int 6
%none_3731 = torch.constant.none
%false_3732 = torch.constant.bool false
%4566 = torch.aten.to.dtype %4565, %int6_3730, %false_3732, %false_3732, %none_3731 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%4567 = torch.aten.matmul %4566, %4549 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_3733 = torch.constant.int 1
%int2_3734 = torch.constant.int 2
%4568 = torch.aten.transpose.int %4567, %int1_3733, %int2_3734 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%4569 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3735 = torch.constant.int 1
%int7_3736 = torch.constant.int 7
%int1600_3737 = torch.constant.int 1600
%4570 = torch.prim.ListConstruct %int1_3735, %int7_3736, %int1600_3737 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4571 = torch.aten.reshape %4568, %4570 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%4572 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_3738 = torch.constant.int 7
%int1600_3739 = torch.constant.int 1600
%4573 = torch.prim.ListConstruct %int7_3738, %int1600_3739 : (!torch.int, !torch.int) -> !torch.list<int>
%4574 = torch.aten.reshape %4571, %4573 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_3740 = torch.constant.int 0
%int1_3741 = torch.constant.int 1
%4575 = torch.aten.mm %4574, %546 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%4576 = torch.aten.add.Tensor %4575, %547, %int1_3741 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%4577 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3742 = torch.constant.int 1
%int7_3743 = torch.constant.int 7
%int1600_3744 = torch.constant.int 1600
%4578 = torch.prim.ListConstruct %int1_3742, %int7_3743, %int1600_3744 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4579 = torch.aten.reshape %4576, %4578 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_3745 = torch.constant.int 1
%4580 = torch.aten.add.Tensor %4579, %4524, %int1_3745 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_3746 = torch.constant.float 9.9999997473787516E-6
%int1600_3747 = torch.constant.int 1600
%4581 = torch.prim.ListConstruct %int1600_3747 : (!torch.int) -> !torch.list<int>
%result0_3748, %result1_3749, %result2_3750 = torch.aten.native_layer_norm %4580, %4581, %548, %549, %float9.999990e-06_3746 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%4582 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_3751 = torch.constant.int 7
%int1600_3752 = torch.constant.int 1600
%4583 = torch.prim.ListConstruct %int7_3751, %int1600_3752 : (!torch.int, !torch.int) -> !torch.list<int>
%4584 = torch.aten.reshape %result0_3748, %4583 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_3753 = torch.constant.int 0
%int1_3754 = torch.constant.int 1
%4585 = torch.aten.mm %4584, %550 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%4586 = torch.aten.add.Tensor %4585, %551, %int1_3754 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%4587 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3755 = torch.constant.int 1
%int7_3756 = torch.constant.int 7
%int6400_3757 = torch.constant.int 6400
%4588 = torch.prim.ListConstruct %int1_3755, %int7_3756, %int6400_3757 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4589 = torch.aten.reshape %4586, %4588 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%4590 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%4591 = torch.aten.mul.Tensor %4589, %4590 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%4592 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%4593 = torch.aten.pow.Tensor_Tensor %4589, %4592 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%4594 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%4595 = torch.aten.mul.Tensor %4593, %4594 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_3758 = torch.constant.int 1
%4596 = torch.aten.add.Tensor %4589, %4595, %int1_3758 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%4597 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%4598 = torch.aten.mul.Tensor %4596, %4597 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%4599 = torch.aten.tanh %4598 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%4600 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_3759 = torch.constant.int 1
%4601 = torch.aten.add.Tensor %4599, %4600, %int1_3759 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%4602 = torch.aten.mul.Tensor %4591, %4601 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%4603 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_3760 = torch.constant.int 7
%int6400_3761 = torch.constant.int 6400
%4604 = torch.prim.ListConstruct %int7_3760, %int6400_3761 : (!torch.int, !torch.int) -> !torch.list<int>
%4605 = torch.aten.reshape %4602, %4604 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_3762 = torch.constant.int 0
%int1_3763 = torch.constant.int 1
%4606 = torch.aten.mm %4605, %552 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%4607 = torch.aten.add.Tensor %4606, %553, %int1_3763 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%4608 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3764 = torch.constant.int 1
%int7_3765 = torch.constant.int 7
%int1600_3766 = torch.constant.int 1600
%4609 = torch.prim.ListConstruct %int1_3764, %int7_3765, %int1600_3766 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4610 = torch.aten.reshape %4607, %4609 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_3767 = torch.constant.int 1
%4611 = torch.aten.add.Tensor %4580, %4610, %int1_3767 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_3768 = torch.constant.float 9.9999997473787516E-6
%int1600_3769 = torch.constant.int 1600
%4612 = torch.prim.ListConstruct %int1600_3769 : (!torch.int) -> !torch.list<int>
%result0_3770, %result1_3771, %result2_3772 = torch.aten.native_layer_norm %4611, %4612, %554, %555, %float9.999990e-06_3768 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%4613 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_3773 = torch.constant.int 7
%int1600_3774 = torch.constant.int 1600
%4614 = torch.prim.ListConstruct %int7_3773, %int1600_3774 : (!torch.int, !torch.int) -> !torch.list<int>
%4615 = torch.aten.reshape %result0_3770, %4614 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_3775 = torch.constant.int 0
%int1_3776 = torch.constant.int 1
%4616 = torch.aten.mm %4615, %556 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%4617 = torch.aten.add.Tensor %4616, %557, %int1_3776 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%4618 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3777 = torch.constant.int 1
%int7_3778 = torch.constant.int 7
%int4800_3779 = torch.constant.int 4800
%4619 = torch.prim.ListConstruct %int1_3777, %int7_3778, %int4800_3779 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4620 = torch.aten.reshape %4617, %4619 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%4621 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%4622 = torch.prim.tolist(%4621) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2_3780 = torch.constant.int 2
%4623 = torch.aten.split_with_sizes %4620, %4622, %int2_3780 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%4624:3 = torch.prim.ListUnpack %4623 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%4625 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_3781 = torch.constant.int 1
%int7_3782 = torch.constant.int 7
%int25_3783 = torch.constant.int 25
%int64_3784 = torch.constant.int 64
%4626 = torch.prim.ListConstruct %int1_3781, %int7_3782, %int25_3783, %int64_3784 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4627 = torch.aten.reshape %4624#0, %4626 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_3785 = torch.constant.int 1
%int2_3786 = torch.constant.int 2
%4628 = torch.aten.transpose.int %4627, %int1_3785, %int2_3786 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%4629 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_3787 = torch.constant.int 1
%int7_3788 = torch.constant.int 7
%int25_3789 = torch.constant.int 25
%int64_3790 = torch.constant.int 64
%4630 = torch.prim.ListConstruct %int1_3787, %int7_3788, %int25_3789, %int64_3790 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4631 = torch.aten.reshape %4624#1, %4630 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_3791 = torch.constant.int 1
%int2_3792 = torch.constant.int 2
%4632 = torch.aten.transpose.int %4631, %int1_3791, %int2_3792 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%4633 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_3793 = torch.constant.int 1
%int7_3794 = torch.constant.int 7
%int25_3795 = torch.constant.int 25
%int64_3796 = torch.constant.int 64
%4634 = torch.prim.ListConstruct %int1_3793, %int7_3794, %int25_3795, %int64_3796 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4635 = torch.aten.reshape %4624#2, %4634 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_3797 = torch.constant.int 1
%int2_3798 = torch.constant.int 2
%4636 = torch.aten.transpose.int %4635, %int1_3797, %int2_3798 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_3799 = torch.constant.int 1
%int2_3800 = torch.constant.int 2
%4637 = torch.aten.transpose.int %4631, %int1_3799, %int2_3800 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_3801 = torch.constant.int 2
%int3_3802 = torch.constant.int 3
%4638 = torch.aten.transpose.int %4637, %int2_3801, %int3_3802 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%4639 = torch.aten.matmul %4628, %4638 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%4640 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%4641 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%4642 = torch.aten.pow.Tensor_Tensor %4640, %4641 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%4643 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_3803 = torch.constant.int 0
%4644 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_3804 = torch.constant.none
%float0.000000e00_3805 = torch.constant.float 0.000000e+00
%4645 = torch.aten.full %4644, %float0.000000e00_3805, %none_3804, %none_3804, %none_3804, %none_3804 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_3806 = torch.constant.int 1
%4646 = torch.aten.add.Tensor %4645, %4642, %int1_3806 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%4647 = torch.aten.div.Tensor %4639, %4646 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%4648 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6_3807 = torch.constant.int 6
%none_3808 = torch.constant.none
%false_3809 = torch.constant.bool false
%4649 = torch.aten.to.dtype %4647, %int6_3807, %false_3809, %false_3809, %none_3808 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%4650 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%4651 = torch.aten.where.self %4648, %4649, %4650 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_3810 = torch.constant.int 3
%none_3811 = torch.constant.none
%4652 = torch.aten.softmax.int %4651, %int3_3810, %none_3811 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_3812 = torch.constant.int 6
%none_3813 = torch.constant.none
%false_3814 = torch.constant.bool false
%4653 = torch.aten.to.dtype %4652, %int6_3812, %false_3814, %false_3814, %none_3813 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%4654 = torch.aten.matmul %4653, %4636 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_3815 = torch.constant.int 1
%int2_3816 = torch.constant.int 2
%4655 = torch.aten.transpose.int %4654, %int1_3815, %int2_3816 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%4656 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3817 = torch.constant.int 1
%int7_3818 = torch.constant.int 7
%int1600_3819 = torch.constant.int 1600
%4657 = torch.prim.ListConstruct %int1_3817, %int7_3818, %int1600_3819 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4658 = torch.aten.reshape %4655, %4657 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%4659 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_3820 = torch.constant.int 7
%int1600_3821 = torch.constant.int 1600
%4660 = torch.prim.ListConstruct %int7_3820, %int1600_3821 : (!torch.int, !torch.int) -> !torch.list<int>
%4661 = torch.aten.reshape %4658, %4660 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_3822 = torch.constant.int 0
%int1_3823 = torch.constant.int 1
%4662 = torch.aten.mm %4661, %558 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%4663 = torch.aten.add.Tensor %4662, %559, %int1_3823 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%4664 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3824 = torch.constant.int 1
%int7_3825 = torch.constant.int 7
%int1600_3826 = torch.constant.int 1600
%4665 = torch.prim.ListConstruct %int1_3824, %int7_3825, %int1600_3826 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4666 = torch.aten.reshape %4663, %4665 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_3827 = torch.constant.int 1
%4667 = torch.aten.add.Tensor %4666, %4611, %int1_3827 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_3828 = torch.constant.float 9.9999997473787516E-6
%int1600_3829 = torch.constant.int 1600
%4668 = torch.prim.ListConstruct %int1600_3829 : (!torch.int) -> !torch.list<int>
%result0_3830, %result1_3831, %result2_3832 = torch.aten.native_layer_norm %4667, %4668, %560, %561, %float9.999990e-06_3828 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%4669 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_3833 = torch.constant.int 7
%int1600_3834 = torch.constant.int 1600
%4670 = torch.prim.ListConstruct %int7_3833, %int1600_3834 : (!torch.int, !torch.int) -> !torch.list<int>
%4671 = torch.aten.reshape %result0_3830, %4670 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_3835 = torch.constant.int 0
%int1_3836 = torch.constant.int 1
%4672 = torch.aten.mm %4671, %562 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%4673 = torch.aten.add.Tensor %4672, %563, %int1_3836 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%4674 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3837 = torch.constant.int 1
%int7_3838 = torch.constant.int 7
%int6400_3839 = torch.constant.int 6400
%4675 = torch.prim.ListConstruct %int1_3837, %int7_3838, %int6400_3839 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4676 = torch.aten.reshape %4673, %4675 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%4677 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%4678 = torch.aten.mul.Tensor %4676, %4677 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%4679 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%4680 = torch.aten.pow.Tensor_Tensor %4676, %4679 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%4681 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%4682 = torch.aten.mul.Tensor %4680, %4681 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_3840 = torch.constant.int 1
%4683 = torch.aten.add.Tensor %4676, %4682, %int1_3840 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%4684 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%4685 = torch.aten.mul.Tensor %4683, %4684 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%4686 = torch.aten.tanh %4685 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%4687 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_3841 = torch.constant.int 1
%4688 = torch.aten.add.Tensor %4686, %4687, %int1_3841 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%4689 = torch.aten.mul.Tensor %4678, %4688 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%4690 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_3842 = torch.constant.int 7
%int6400_3843 = torch.constant.int 6400
%4691 = torch.prim.ListConstruct %int7_3842, %int6400_3843 : (!torch.int, !torch.int) -> !torch.list<int>
%4692 = torch.aten.reshape %4689, %4691 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_3844 = torch.constant.int 0
%int1_3845 = torch.constant.int 1
%4693 = torch.aten.mm %4692, %564 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%4694 = torch.aten.add.Tensor %4693, %565, %int1_3845 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%4695 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3846 = torch.constant.int 1
%int7_3847 = torch.constant.int 7
%int1600_3848 = torch.constant.int 1600
%4696 = torch.prim.ListConstruct %int1_3846, %int7_3847, %int1600_3848 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4697 = torch.aten.reshape %4694, %4696 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_3849 = torch.constant.int 1
%4698 = torch.aten.add.Tensor %4667, %4697, %int1_3849 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_3850 = torch.constant.float 9.9999997473787516E-6
%int1600_3851 = torch.constant.int 1600
%4699 = torch.prim.ListConstruct %int1600_3851 : (!torch.int) -> !torch.list<int>
%result0_3852, %result1_3853, %result2_3854 = torch.aten.native_layer_norm %4698, %4699, %566, %567, %float9.999990e-06_3850 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%4700 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_3855 = torch.constant.int 7
%int1600_3856 = torch.constant.int 1600
%4701 = torch.prim.ListConstruct %int7_3855, %int1600_3856 : (!torch.int, !torch.int) -> !torch.list<int>
%4702 = torch.aten.reshape %result0_3852, %4701 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_3857 = torch.constant.int 0
%int1_3858 = torch.constant.int 1
%4703 = torch.aten.mm %4702, %568 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,4800],f32> -> !torch.vtensor<[7,4800],f32>
%4704 = torch.aten.add.Tensor %4703, %569, %int1_3858 : !torch.vtensor<[7,4800],f32>, !torch.vtensor<[4800],f32>, !torch.int -> !torch.vtensor<[7,4800],f32>
%4705 = torch.vtensor.literal(dense<[1, 7, 4800]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3859 = torch.constant.int 1
%int7_3860 = torch.constant.int 7
%int4800_3861 = torch.constant.int 4800
%4706 = torch.prim.ListConstruct %int1_3859, %int7_3860, %int4800_3861 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4707 = torch.aten.reshape %4704, %4706 : !torch.vtensor<[7,4800],f32>, !torch.list<int> -> !torch.vtensor<[1,7,4800],f32>
%4708 = torch.vtensor.literal(dense<1600> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%4709 = torch.prim.tolist(%4708) : !torch.vtensor<[3],si64> -> !torch.list<int>
%int2_3862 = torch.constant.int 2
%4710 = torch.aten.split_with_sizes %4707, %4709, %int2_3862 : !torch.vtensor<[1,7,4800],f32>, !torch.list<int>, !torch.int -> !torch.list<vtensor<[1,7,1600],f32>>
%4711:3 = torch.prim.ListUnpack %4710 : !torch.list<vtensor<[1,7,1600],f32>> -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>
%4712 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_3863 = torch.constant.int 1
%int7_3864 = torch.constant.int 7
%int25_3865 = torch.constant.int 25
%int64_3866 = torch.constant.int 64
%4713 = torch.prim.ListConstruct %int1_3863, %int7_3864, %int25_3865, %int64_3866 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4714 = torch.aten.reshape %4711#0, %4713 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_3867 = torch.constant.int 1
%int2_3868 = torch.constant.int 2
%4715 = torch.aten.transpose.int %4714, %int1_3867, %int2_3868 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%4716 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_3869 = torch.constant.int 1
%int7_3870 = torch.constant.int 7
%int25_3871 = torch.constant.int 25
%int64_3872 = torch.constant.int 64
%4717 = torch.prim.ListConstruct %int1_3869, %int7_3870, %int25_3871, %int64_3872 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4718 = torch.aten.reshape %4711#1, %4717 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_3873 = torch.constant.int 1
%int2_3874 = torch.constant.int 2
%4719 = torch.aten.transpose.int %4718, %int1_3873, %int2_3874 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%4720 = torch.vtensor.literal(dense<[1, 7, 25, 64]> : tensor<4xsi64>) : !torch.vtensor<[4],si64>
%int1_3875 = torch.constant.int 1
%int7_3876 = torch.constant.int 7
%int25_3877 = torch.constant.int 25
%int64_3878 = torch.constant.int 64
%4721 = torch.prim.ListConstruct %int1_3875, %int7_3876, %int25_3877, %int64_3878 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4722 = torch.aten.reshape %4711#2, %4721 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,25,64],f32>
%int1_3879 = torch.constant.int 1
%int2_3880 = torch.constant.int 2
%4723 = torch.aten.transpose.int %4722, %int1_3879, %int2_3880 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int1_3881 = torch.constant.int 1
%int2_3882 = torch.constant.int 2
%4724 = torch.aten.transpose.int %4718, %int1_3881, %int2_3882 : !torch.vtensor<[1,7,25,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,7,64],f32>
%int2_3883 = torch.constant.int 2
%int3_3884 = torch.constant.int 3
%4725 = torch.aten.transpose.int %4724, %int2_3883, %int3_3884 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,25,64,7],f32>
%4726 = torch.aten.matmul %4715, %4725 : !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,64,7],f32> -> !torch.vtensor<[1,25,7,7],f32>
%4727 = torch.vtensor.literal(dense<6.400000e+01> : tensor<f32>) : !torch.vtensor<[],f32>
%4728 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%4729 = torch.aten.pow.Tensor_Tensor %4727, %4728 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[],f32>
%4730 = torch.vtensor.literal(dense<> : tensor<0xsi64>) : !torch.vtensor<[0],si64>
%int0_3885 = torch.constant.int 0
%4731 = torch.prim.ListConstruct : () -> !torch.list<int>
%none_3886 = torch.constant.none
%float0.000000e00_3887 = torch.constant.float 0.000000e+00
%4732 = torch.aten.full %4731, %float0.000000e00_3887, %none_3886, %none_3886, %none_3886, %none_3886 : !torch.list<int>, !torch.float, !torch.none, !torch.none, !torch.none, !torch.none -> !torch.vtensor<[],f32>
%int1_3888 = torch.constant.int 1
%4733 = torch.aten.add.Tensor %4732, %4729, %int1_3888 : !torch.vtensor<[],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[],f32>
%4734 = torch.aten.div.Tensor %4726, %4733 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%4735 = torch.vtensor.literal(dense_resource<__elided__> : tensor<1x1x7x7xi1>) : !torch.vtensor<[1,1,7,7],i1>
%int6_3889 = torch.constant.int 6
%none_3890 = torch.constant.none
%false_3891 = torch.constant.bool false
%4736 = torch.aten.to.dtype %4734, %int6_3889, %false_3891, %false_3891, %none_3890 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%4737 = torch.vtensor.literal(dense<-3.40282347E+38> : tensor<f32>) : !torch.vtensor<[],f32>
%4738 = torch.aten.where.self %4735, %4736, %4737 : !torch.vtensor<[1,1,7,7],i1>, !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,25,7,7],f32>
%int3_3892 = torch.constant.int 3
%none_3893 = torch.constant.none
%4739 = torch.aten.softmax.int %4738, %int3_3892, %none_3893 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%int6_3894 = torch.constant.int 6
%none_3895 = torch.constant.none
%false_3896 = torch.constant.bool false
%4740 = torch.aten.to.dtype %4739, %int6_3894, %false_3896, %false_3896, %none_3895 : !torch.vtensor<[1,25,7,7],f32>, !torch.int, !torch.bool, !torch.bool, !torch.none -> !torch.vtensor<[1,25,7,7],f32>
%4741 = torch.aten.matmul %4740, %4723 : !torch.vtensor<[1,25,7,7],f32>, !torch.vtensor<[1,25,7,64],f32> -> !torch.vtensor<[1,25,7,64],f32>
%int1_3897 = torch.constant.int 1
%int2_3898 = torch.constant.int 2
%4742 = torch.aten.transpose.int %4741, %int1_3897, %int2_3898 : !torch.vtensor<[1,25,7,64],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,7,25,64],f32>
%4743 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3899 = torch.constant.int 1
%int7_3900 = torch.constant.int 7
%int1600_3901 = torch.constant.int 1600
%4744 = torch.prim.ListConstruct %int1_3899, %int7_3900, %int1600_3901 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4745 = torch.aten.reshape %4742, %4744 : !torch.vtensor<[1,7,25,64],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%4746 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_3902 = torch.constant.int 7
%int1600_3903 = torch.constant.int 1600
%4747 = torch.prim.ListConstruct %int7_3902, %int1600_3903 : (!torch.int, !torch.int) -> !torch.list<int>
%4748 = torch.aten.reshape %4745, %4747 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_3904 = torch.constant.int 0
%int1_3905 = torch.constant.int 1
%4749 = torch.aten.mm %4748, %570 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,1600],f32> -> !torch.vtensor<[7,1600],f32>
%4750 = torch.aten.add.Tensor %4749, %571, %int1_3905 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%4751 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3906 = torch.constant.int 1
%int7_3907 = torch.constant.int 7
%int1600_3908 = torch.constant.int 1600
%4752 = torch.prim.ListConstruct %int1_3906, %int7_3907, %int1600_3908 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4753 = torch.aten.reshape %4750, %4752 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_3909 = torch.constant.int 1
%4754 = torch.aten.add.Tensor %4753, %4698, %int1_3909 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_3910 = torch.constant.float 9.9999997473787516E-6
%int1600_3911 = torch.constant.int 1600
%4755 = torch.prim.ListConstruct %int1600_3911 : (!torch.int) -> !torch.list<int>
%result0_3912, %result1_3913, %result2_3914 = torch.aten.native_layer_norm %4754, %4755, %572, %573, %float9.999990e-06_3910 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%4756 = torch.vtensor.literal(dense<[-1, 1600]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_3915 = torch.constant.int 7
%int1600_3916 = torch.constant.int 1600
%4757 = torch.prim.ListConstruct %int7_3915, %int1600_3916 : (!torch.int, !torch.int) -> !torch.list<int>
%4758 = torch.aten.reshape %result0_3912, %4757 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[7,1600],f32>
%int0_3917 = torch.constant.int 0
%int1_3918 = torch.constant.int 1
%4759 = torch.aten.mm %4758, %574 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600,6400],f32> -> !torch.vtensor<[7,6400],f32>
%4760 = torch.aten.add.Tensor %4759, %575, %int1_3918 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400],f32>, !torch.int -> !torch.vtensor<[7,6400],f32>
%4761 = torch.vtensor.literal(dense<[1, 7, 6400]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3919 = torch.constant.int 1
%int7_3920 = torch.constant.int 7
%int6400_3921 = torch.constant.int 6400
%4762 = torch.prim.ListConstruct %int1_3919, %int7_3920, %int6400_3921 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4763 = torch.aten.reshape %4760, %4762 : !torch.vtensor<[7,6400],f32>, !torch.list<int> -> !torch.vtensor<[1,7,6400],f32>
%4764 = torch.vtensor.literal(dense<5.000000e-01> : tensor<f32>) : !torch.vtensor<[],f32>
%4765 = torch.aten.mul.Tensor %4763, %4764 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%4766 = torch.vtensor.literal(dense<3.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%4767 = torch.aten.pow.Tensor_Tensor %4763, %4766 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%4768 = torch.vtensor.literal(dense<4.471500e-02> : tensor<f32>) : !torch.vtensor<[],f32>
%4769 = torch.aten.mul.Tensor %4767, %4768 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%int1_3922 = torch.constant.int 1
%4770 = torch.aten.add.Tensor %4763, %4769, %int1_3922 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%4771 = torch.vtensor.literal(dense<0.797884583> : tensor<f32>) : !torch.vtensor<[],f32>
%4772 = torch.aten.mul.Tensor %4770, %4771 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32> -> !torch.vtensor<[1,7,6400],f32>
%4773 = torch.aten.tanh %4772 : !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%4774 = torch.vtensor.literal(dense<1.000000e+00> : tensor<f32>) : !torch.vtensor<[],f32>
%int1_3923 = torch.constant.int 1
%4775 = torch.aten.add.Tensor %4773, %4774, %int1_3923 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[],f32>, !torch.int -> !torch.vtensor<[1,7,6400],f32>
%4776 = torch.aten.mul.Tensor %4765, %4775 : !torch.vtensor<[1,7,6400],f32>, !torch.vtensor<[1,7,6400],f32> -> !torch.vtensor<[1,7,6400],f32>
%4777 = torch.vtensor.literal(dense<[-1, 6400]> : tensor<2xsi64>) : !torch.vtensor<[2],si64>
%int7_3924 = torch.constant.int 7
%int6400_3925 = torch.constant.int 6400
%4778 = torch.prim.ListConstruct %int7_3924, %int6400_3925 : (!torch.int, !torch.int) -> !torch.list<int>
%4779 = torch.aten.reshape %4776, %4778 : !torch.vtensor<[1,7,6400],f32>, !torch.list<int> -> !torch.vtensor<[7,6400],f32>
%int0_3926 = torch.constant.int 0
%int1_3927 = torch.constant.int 1
%4780 = torch.aten.mm %4779, %576 : !torch.vtensor<[7,6400],f32>, !torch.vtensor<[6400,1600],f32> -> !torch.vtensor<[7,1600],f32>
%4781 = torch.aten.add.Tensor %4780, %577, %int1_3927 : !torch.vtensor<[7,1600],f32>, !torch.vtensor<[1600],f32>, !torch.int -> !torch.vtensor<[7,1600],f32>
%4782 = torch.vtensor.literal(dense<[1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3928 = torch.constant.int 1
%int7_3929 = torch.constant.int 7
%int1600_3930 = torch.constant.int 1600
%4783 = torch.prim.ListConstruct %int1_3928, %int7_3929, %int1600_3930 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4784 = torch.aten.reshape %4781, %4783 : !torch.vtensor<[7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%int1_3931 = torch.constant.int 1
%4785 = torch.aten.add.Tensor %4754, %4784, %int1_3931 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1600],f32>, !torch.int -> !torch.vtensor<[1,7,1600],f32>
%float9.999990e-06_3932 = torch.constant.float 9.9999997473787516E-6
%int1600_3933 = torch.constant.int 1600
%4786 = torch.prim.ListConstruct %int1600_3933 : (!torch.int) -> !torch.list<int>
%result0_3934, %result1_3935, %result2_3936 = torch.aten.native_layer_norm %4785, %4786, %578, %579, %float9.999990e-06_3932 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int>, !torch.vtensor<[1600],f32>, !torch.vtensor<[1600],f32>, !torch.float -> !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1,7,1],f32>, !torch.vtensor<[1,7,1],f32>
%4787 = torch.vtensor.literal(dense<[-1, 7, 1600]> : tensor<3xsi64>) : !torch.vtensor<[3],si64>
%int1_3937 = torch.constant.int 1
%int7_3938 = torch.constant.int 7
%int1600_3939 = torch.constant.int 1600
%4788 = torch.prim.ListConstruct %int1_3937, %int7_3938, %int1600_3939 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%4789 = torch.aten.reshape %result0_3934, %4788 : !torch.vtensor<[1,7,1600],f32>, !torch.list<int> -> !torch.vtensor<[1,7,1600],f32>
%4790 = torch.aten.matmul %4789, %580 : !torch.vtensor<[1,7,1600],f32>, !torch.vtensor<[1600,50257],f32> -> !torch.vtensor<[1,7,50257],f32>
return %4790, %630, %634, %717, %721, %804, %808, %891, %895, %978, %982, %1065, %1069, %1152, %1156, %1239, %1243, %1326, %1330, %1413, %1417, %1500, %1504, %1587, %1591, %1674, %1678, %1761, %1765, %1848, %1852, %1935, %1939, %2022, %2026, %2109, %2113, %2196, %2200, %2283, %2287, %2370, %2374, %2457, %2461, %2544, %2548, %2631, %2635, %2718, %2722, %2805, %2809, %2892, %2896, %2979, %2983, %3066, %3070, %3153, %3157, %3240, %3244, %3327, %3331, %3414, %3418, %3501, %3505, %3588, %3592, %3675, %3679, %3762, %3766, %3849, %3853, %3936, %3940, %4023, %4027, %4110, %4114, %4197, %4201, %4284, %4288, %4371, %4375, %4458, %4462, %4545, %4549, %4632, %4636, %4719, %4723 : !torch.vtensor<[1,7,50257],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>, !torch.vtensor<[1,25,7,64],f32>
}
}
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment