Created
April 5, 2022 15:40
-
-
Save pashu123/250dc2d8c8ecfd26be7d1827c943138e to your computer and use it in GitHub Desktop.
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
module attributes {torch.debug_module_name = "GraphModule"} { | |
func private @__torch__.torch.fx.graph_module.___torch_mangle_2.GraphModule.forward(%arg0: !torch.nn.Module<"__torch__.torch.fx.graph_module.___torch_mangle_2.GraphModule">, %arg1: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg2: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg3: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg4: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg5: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg6: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg7: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg8: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg9: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg10: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg11: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg12: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg13: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg14: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg15: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg16: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg17: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg18: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg19: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg20: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg21: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg22: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg23: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg24: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg25: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg26: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg27: 
!torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg28: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg29: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg30: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg31: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg32: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg33: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg34: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg35: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg36: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg37: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg38: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg39: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg40: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg41: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg42: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg43: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg44: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg45: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg46: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg47: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg48: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg49: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg50: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg51: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg52: !torch.tensor {torch.type_bound = !torch.vtensor<[768],f32>}, %arg53: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512],si64>}, %arg54: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512],si64>}, %arg55: !torch.tensor {torch.type_bound = 
!torch.vtensor<[1,512],si64>}, %arg56: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg57: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg58: !torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg59: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg60: !torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg61: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg62: !torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg63: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg64: !torch.tensor {torch.type_bound = !torch.vtensor<[48,512,64],f32>}, %arg65: !torch.tensor {torch.type_bound = !torch.vtensor<[48,64,512],f32>}, %arg66: !torch.tensor {torch.type_bound = !torch.vtensor<[4,12,512,512],f32>}, %arg67: !torch.tensor {torch.type_bound = !torch.vtensor<[4,12,512,512],f32>}, %arg68: !torch.tensor {torch.type_bound = !torch.vtensor<[48,512,512],f32>}, %arg69: !torch.tensor {torch.type_bound = !torch.vtensor<[48,512,64],f32>}, %arg70: !torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg71: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg72: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg73: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg74: !torch.tensor {torch.type_bound = !torch.vtensor<[768,3072],f32>}, %arg75: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg76: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,3072],f32>}, %arg77: !torch.tensor {torch.type_bound = !torch.vtensor<[3072,768],f32>}, %arg78: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,3072],f32>}, %arg79: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg80: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg81: !torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, 
%arg82: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg83: !torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg84: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg85: !torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg86: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg87: !torch.tensor {torch.type_bound = !torch.vtensor<[48,512,64],f32>}, %arg88: !torch.tensor {torch.type_bound = !torch.vtensor<[48,64,512],f32>}, %arg89: !torch.tensor {torch.type_bound = !torch.vtensor<[4,12,512,512],f32>}, %arg90: !torch.tensor {torch.type_bound = !torch.vtensor<[4,12,512,512],f32>}, %arg91: !torch.tensor {torch.type_bound = !torch.vtensor<[48,512,512],f32>}, %arg92: !torch.tensor {torch.type_bound = !torch.vtensor<[48,512,64],f32>}, %arg93: !torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg94: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg95: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg96: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg97: !torch.tensor {torch.type_bound = !torch.vtensor<[768,3072],f32>}, %arg98: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg99: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,3072],f32>}, %arg100: !torch.tensor {torch.type_bound = !torch.vtensor<[3072,768],f32>}, %arg101: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,3072],f32>}, %arg102: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg103: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg104: !torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg105: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg106: !torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg107: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg108: !torch.tensor 
{torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg109: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg110: !torch.tensor {torch.type_bound = !torch.vtensor<[48,512,64],f32>}, %arg111: !torch.tensor {torch.type_bound = !torch.vtensor<[48,64,512],f32>}, %arg112: !torch.tensor {torch.type_bound = !torch.vtensor<[4,12,512,512],f32>}, %arg113: !torch.tensor {torch.type_bound = !torch.vtensor<[4,12,512,512],f32>}, %arg114: !torch.tensor {torch.type_bound = !torch.vtensor<[48,512,512],f32>}, %arg115: !torch.tensor {torch.type_bound = !torch.vtensor<[48,512,64],f32>}, %arg116: !torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg117: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg118: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg119: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg120: !torch.tensor {torch.type_bound = !torch.vtensor<[768,3072],f32>}, %arg121: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg122: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,3072],f32>}, %arg123: !torch.tensor {torch.type_bound = !torch.vtensor<[3072,768],f32>}, %arg124: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,3072],f32>}, %arg125: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg126: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg127: !torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg128: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg129: !torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg130: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg131: !torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg132: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg133: !torch.tensor {torch.type_bound = !torch.vtensor<[48,512,64],f32>}, %arg134: !torch.tensor 
{torch.type_bound = !torch.vtensor<[48,64,512],f32>}, %arg135: !torch.tensor {torch.type_bound = !torch.vtensor<[4,12,512,512],f32>}, %arg136: !torch.tensor {torch.type_bound = !torch.vtensor<[4,12,512,512],f32>}, %arg137: !torch.tensor {torch.type_bound = !torch.vtensor<[48,512,512],f32>}, %arg138: !torch.tensor {torch.type_bound = !torch.vtensor<[48,512,64],f32>}, %arg139: !torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg140: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg141: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg142: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg143: !torch.tensor {torch.type_bound = !torch.vtensor<[768,3072],f32>}, %arg144: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg145: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,3072],f32>}, %arg146: !torch.tensor {torch.type_bound = !torch.vtensor<[3072,768],f32>}, %arg147: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,3072],f32>}, %arg148: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg149: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg150: !torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg151: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg152: !torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg153: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg154: !torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg155: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg156: !torch.tensor {torch.type_bound = !torch.vtensor<[48,512,64],f32>}, %arg157: !torch.tensor {torch.type_bound = !torch.vtensor<[48,64,512],f32>}, %arg158: !torch.tensor {torch.type_bound = !torch.vtensor<[4,12,512,512],f32>}, %arg159: !torch.tensor {torch.type_bound = !torch.vtensor<[4,12,512,512],f32>}, %arg160: 
!torch.tensor {torch.type_bound = !torch.vtensor<[48,512,512],f32>}, %arg161: !torch.tensor {torch.type_bound = !torch.vtensor<[48,512,64],f32>}, %arg162: !torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg163: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg164: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg165: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg166: !torch.tensor {torch.type_bound = !torch.vtensor<[768,3072],f32>}, %arg167: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg168: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,3072],f32>}, %arg169: !torch.tensor {torch.type_bound = !torch.vtensor<[3072,768],f32>}, %arg170: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,3072],f32>}, %arg171: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg172: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg173: !torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg174: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg175: !torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg176: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg177: !torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg178: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg179: !torch.tensor {torch.type_bound = !torch.vtensor<[48,512,64],f32>}, %arg180: !torch.tensor {torch.type_bound = !torch.vtensor<[48,64,512],f32>}, %arg181: !torch.tensor {torch.type_bound = !torch.vtensor<[4,12,512,512],f32>}, %arg182: !torch.tensor {torch.type_bound = !torch.vtensor<[4,12,512,512],f32>}, %arg183: !torch.tensor {torch.type_bound = !torch.vtensor<[48,512,512],f32>}, %arg184: !torch.tensor {torch.type_bound = !torch.vtensor<[48,512,64],f32>}, %arg185: !torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg186: 
!torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg187: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg188: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg189: !torch.tensor {torch.type_bound = !torch.vtensor<[768,3072],f32>}, %arg190: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg191: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,3072],f32>}, %arg192: !torch.tensor {torch.type_bound = !torch.vtensor<[3072,768],f32>}, %arg193: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,3072],f32>}, %arg194: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg195: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg196: !torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg197: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg198: !torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg199: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg200: !torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg201: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg202: !torch.tensor {torch.type_bound = !torch.vtensor<[48,512,64],f32>}, %arg203: !torch.tensor {torch.type_bound = !torch.vtensor<[48,64,512],f32>}, %arg204: !torch.tensor {torch.type_bound = !torch.vtensor<[4,12,512,512],f32>}, %arg205: !torch.tensor {torch.type_bound = !torch.vtensor<[4,12,512,512],f32>}, %arg206: !torch.tensor {torch.type_bound = !torch.vtensor<[48,512,512],f32>}, %arg207: !torch.tensor {torch.type_bound = !torch.vtensor<[48,512,64],f32>}, %arg208: !torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg209: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg210: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg211: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg212: 
!torch.tensor {torch.type_bound = !torch.vtensor<[768,3072],f32>}, %arg213: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg214: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,3072],f32>}, %arg215: !torch.tensor {torch.type_bound = !torch.vtensor<[3072,768],f32>}, %arg216: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,3072],f32>}, %arg217: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg218: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg219: !torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg220: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg221: !torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg222: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg223: !torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg224: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg225: !torch.tensor {torch.type_bound = !torch.vtensor<[48,512,64],f32>}, %arg226: !torch.tensor {torch.type_bound = !torch.vtensor<[48,64,512],f32>}, %arg227: !torch.tensor {torch.type_bound = !torch.vtensor<[4,12,512,512],f32>}, %arg228: !torch.tensor {torch.type_bound = !torch.vtensor<[4,12,512,512],f32>}, %arg229: !torch.tensor {torch.type_bound = !torch.vtensor<[48,512,512],f32>}, %arg230: !torch.tensor {torch.type_bound = !torch.vtensor<[48,512,64],f32>}, %arg231: !torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg232: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg233: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg234: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg235: !torch.tensor {torch.type_bound = !torch.vtensor<[768,3072],f32>}, %arg236: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg237: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,3072],f32>}, %arg238: 
!torch.tensor {torch.type_bound = !torch.vtensor<[3072,768],f32>}, %arg239: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,3072],f32>}, %arg240: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg241: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg242: !torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg243: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg244: !torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg245: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg246: !torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg247: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg248: !torch.tensor {torch.type_bound = !torch.vtensor<[48,512,64],f32>}, %arg249: !torch.tensor {torch.type_bound = !torch.vtensor<[48,64,512],f32>}, %arg250: !torch.tensor {torch.type_bound = !torch.vtensor<[4,12,512,512],f32>}, %arg251: !torch.tensor {torch.type_bound = !torch.vtensor<[4,12,512,512],f32>}, %arg252: !torch.tensor {torch.type_bound = !torch.vtensor<[48,512,512],f32>}, %arg253: !torch.tensor {torch.type_bound = !torch.vtensor<[48,512,64],f32>}, %arg254: !torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg255: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg256: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg257: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg258: !torch.tensor {torch.type_bound = !torch.vtensor<[768,3072],f32>}, %arg259: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg260: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,3072],f32>}, %arg261: !torch.tensor {torch.type_bound = !torch.vtensor<[3072,768],f32>}, %arg262: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,3072],f32>}, %arg263: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg264: 
!torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg265: !torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg266: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg267: !torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg268: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg269: !torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg270: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg271: !torch.tensor {torch.type_bound = !torch.vtensor<[48,512,64],f32>}, %arg272: !torch.tensor {torch.type_bound = !torch.vtensor<[48,64,512],f32>}, %arg273: !torch.tensor {torch.type_bound = !torch.vtensor<[4,12,512,512],f32>}, %arg274: !torch.tensor {torch.type_bound = !torch.vtensor<[4,12,512,512],f32>}, %arg275: !torch.tensor {torch.type_bound = !torch.vtensor<[48,512,512],f32>}, %arg276: !torch.tensor {torch.type_bound = !torch.vtensor<[48,512,64],f32>}, %arg277: !torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg278: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg279: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg280: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg281: !torch.tensor {torch.type_bound = !torch.vtensor<[768,3072],f32>}, %arg282: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg283: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,3072],f32>}, %arg284: !torch.tensor {torch.type_bound = !torch.vtensor<[3072,768],f32>}, %arg285: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,3072],f32>}, %arg286: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg287: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg288: !torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg289: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg290: 
!torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg291: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg292: !torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg293: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg294: !torch.tensor {torch.type_bound = !torch.vtensor<[48,512,64],f32>}, %arg295: !torch.tensor {torch.type_bound = !torch.vtensor<[48,64,512],f32>}, %arg296: !torch.tensor {torch.type_bound = !torch.vtensor<[4,12,512,512],f32>}, %arg297: !torch.tensor {torch.type_bound = !torch.vtensor<[4,12,512,512],f32>}, %arg298: !torch.tensor {torch.type_bound = !torch.vtensor<[48,512,512],f32>}, %arg299: !torch.tensor {torch.type_bound = !torch.vtensor<[48,512,64],f32>}, %arg300: !torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg301: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg302: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg303: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg304: !torch.tensor {torch.type_bound = !torch.vtensor<[768,3072],f32>}, %arg305: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg306: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,3072],f32>}, %arg307: !torch.tensor {torch.type_bound = !torch.vtensor<[3072,768],f32>}, %arg308: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,3072],f32>}, %arg309: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg310: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg311: !torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg312: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg313: !torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg314: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg315: !torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg316: 
!torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg317: !torch.tensor {torch.type_bound = !torch.vtensor<[48,512,64],f32>}, %arg318: !torch.tensor {torch.type_bound = !torch.vtensor<[48,64,512],f32>}, %arg319: !torch.tensor {torch.type_bound = !torch.vtensor<[4,12,512,512],f32>}, %arg320: !torch.tensor {torch.type_bound = !torch.vtensor<[4,12,512,512],f32>}, %arg321: !torch.tensor {torch.type_bound = !torch.vtensor<[48,512,512],f32>}, %arg322: !torch.tensor {torch.type_bound = !torch.vtensor<[48,512,64],f32>}, %arg323: !torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg324: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg325: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg326: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg327: !torch.tensor {torch.type_bound = !torch.vtensor<[768,3072],f32>}, %arg328: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg329: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,3072],f32>}, %arg330: !torch.tensor {torch.type_bound = !torch.vtensor<[3072,768],f32>}, %arg331: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,3072],f32>}, %arg332: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg333: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg334: !torch.tensor {torch.type_bound = !torch.vtensor<[768,768],f32>}, %arg335: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg336: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg337: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,768],f32>}, %arg338: !torch.tensor {torch.type_bound = !torch.vtensor<[768,30522],f32>}, %arg339: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,768],f32>}, %arg340: !torch.tensor {torch.type_bound = !torch.vtensor<[2048],si64>}, %arg341: !torch.tensor {torch.type_bound = !torch.vtensor<[2048,30522],f32>}, %arg342: 
!torch.tensor {torch.type_bound = !torch.vtensor<[],f32>}, %arg343: !torch.tensor {torch.type_bound = !torch.vtensor<[4,512,30522],f32>}) -> !torch.tuple<tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor> { | |
%cpu = torch.constant.device "cpu" | |
%1 = torch.tensor.literal(dense<8.000000e+00> : tensor<f64>) : !torch.tensor<[],f64> | |
%str = torch.constant.str "none" | |
%false = torch.constant.bool false | |
%2 = torch.tensor.literal(dense<768> : tensor<si64>) : !torch.tensor<[],si64> | |
%true = torch.constant.bool true | |
%none = torch.constant.none | |
%int768 = torch.constant.int 768 | |
%float9.999990e-13 = torch.constant.float 9.9999999999999998E-13 | |
%int1 = torch.constant.int 1 | |
%int-100 = torch.constant.int -100 | |
%int6 = torch.constant.int 6 | |
%int4 = torch.constant.int 4 | |
%int512 = torch.constant.int 512 | |
%int30522 = torch.constant.int 30522 | |
%int2048 = torch.constant.int 2048 | |
%int0 = torch.constant.int 0 | |
%int2 = torch.constant.int 2 | |
%int3072 = torch.constant.int 3072 | |
%int12 = torch.constant.int 12 | |
%int64 = torch.constant.int 64 | |
%int3 = torch.constant.int 3 | |
%int48 = torch.constant.int 48 | |
%int-1 = torch.constant.int -1 | |
%int-2 = torch.constant.int -2 | |
%3 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%result0, %result1, %result2 = torch.aten.native_layer_norm %arg56, %3, %arg2, %arg1, %float9.999990e-13 : !torch.tensor, !torch.list<int>, !torch.tensor, !torch.tensor, !torch.float -> !torch.tensor, !torch.tensor, !torch.tensor | |
%4 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%result0_0, %result1_1, %result2_2 = torch.aten.native_layer_norm %arg73, %4, %arg4, %arg3, %float9.999990e-13 : !torch.tensor, !torch.list<int>, !torch.tensor, !torch.tensor, !torch.float -> !torch.tensor, !torch.tensor, !torch.tensor | |
%5 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%result0_3, %result1_4, %result2_5 = torch.aten.native_layer_norm %arg80, %5, %arg6, %arg5, %float9.999990e-13 : !torch.tensor, !torch.list<int>, !torch.tensor, !torch.tensor, !torch.float -> !torch.tensor, !torch.tensor, !torch.tensor | |
%6 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%result0_6, %result1_7, %result2_8 = torch.aten.native_layer_norm %arg96, %6, %arg8, %arg7, %float9.999990e-13 : !torch.tensor, !torch.list<int>, !torch.tensor, !torch.tensor, !torch.float -> !torch.tensor, !torch.tensor, !torch.tensor | |
%7 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%result0_9, %result1_10, %result2_11 = torch.aten.native_layer_norm %arg103, %7, %arg10, %arg9, %float9.999990e-13 : !torch.tensor, !torch.list<int>, !torch.tensor, !torch.tensor, !torch.float -> !torch.tensor, !torch.tensor, !torch.tensor | |
%8 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%result0_12, %result1_13, %result2_14 = torch.aten.native_layer_norm %arg119, %8, %arg20, %arg19, %float9.999990e-13 : !torch.tensor, !torch.list<int>, !torch.tensor, !torch.tensor, !torch.float -> !torch.tensor, !torch.tensor, !torch.tensor | |
%9 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%result0_15, %result1_16, %result2_17 = torch.aten.native_layer_norm %arg126, %9, %arg22, %arg21, %float9.999990e-13 : !torch.tensor, !torch.list<int>, !torch.tensor, !torch.tensor, !torch.float -> !torch.tensor, !torch.tensor, !torch.tensor | |
%10 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%result0_18, %result1_19, %result2_20 = torch.aten.native_layer_norm %arg142, %10, %arg24, %arg23, %float9.999990e-13 : !torch.tensor, !torch.list<int>, !torch.tensor, !torch.tensor, !torch.float -> !torch.tensor, !torch.tensor, !torch.tensor | |
%11 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%result0_21, %result1_22, %result2_23 = torch.aten.native_layer_norm %arg149, %11, %arg26, %arg25, %float9.999990e-13 : !torch.tensor, !torch.list<int>, !torch.tensor, !torch.tensor, !torch.float -> !torch.tensor, !torch.tensor, !torch.tensor | |
%12 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%result0_24, %result1_25, %result2_26 = torch.aten.native_layer_norm %arg165, %12, %arg28, %arg27, %float9.999990e-13 : !torch.tensor, !torch.list<int>, !torch.tensor, !torch.tensor, !torch.float -> !torch.tensor, !torch.tensor, !torch.tensor | |
%13 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%result0_27, %result1_28, %result2_29 = torch.aten.native_layer_norm %arg172, %13, %arg30, %arg29, %float9.999990e-13 : !torch.tensor, !torch.list<int>, !torch.tensor, !torch.tensor, !torch.float -> !torch.tensor, !torch.tensor, !torch.tensor | |
%14 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%result0_30, %result1_31, %result2_32 = torch.aten.native_layer_norm %arg188, %14, %arg32, %arg31, %float9.999990e-13 : !torch.tensor, !torch.list<int>, !torch.tensor, !torch.tensor, !torch.float -> !torch.tensor, !torch.tensor, !torch.tensor | |
%15 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%result0_33, %result1_34, %result2_35 = torch.aten.native_layer_norm %arg195, %15, %arg34, %arg33, %float9.999990e-13 : !torch.tensor, !torch.list<int>, !torch.tensor, !torch.tensor, !torch.float -> !torch.tensor, !torch.tensor, !torch.tensor | |
%16 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%result0_36, %result1_37, %result2_38 = torch.aten.native_layer_norm %arg211, %16, %arg36, %arg35, %float9.999990e-13 : !torch.tensor, !torch.list<int>, !torch.tensor, !torch.tensor, !torch.float -> !torch.tensor, !torch.tensor, !torch.tensor | |
%17 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%result0_39, %result1_40, %result2_41 = torch.aten.native_layer_norm %arg218, %17, %arg38, %arg37, %float9.999990e-13 : !torch.tensor, !torch.list<int>, !torch.tensor, !torch.tensor, !torch.float -> !torch.tensor, !torch.tensor, !torch.tensor | |
%18 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%result0_42, %result1_43, %result2_44 = torch.aten.native_layer_norm %arg234, %18, %arg40, %arg39, %float9.999990e-13 : !torch.tensor, !torch.list<int>, !torch.tensor, !torch.tensor, !torch.float -> !torch.tensor, !torch.tensor, !torch.tensor | |
%19 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%result0_45, %result1_46, %result2_47 = torch.aten.native_layer_norm %arg241, %19, %arg42, %arg41, %float9.999990e-13 : !torch.tensor, !torch.list<int>, !torch.tensor, !torch.tensor, !torch.float -> !torch.tensor, !torch.tensor, !torch.tensor | |
%20 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%result0_48, %result1_49, %result2_50 = torch.aten.native_layer_norm %arg257, %20, %arg44, %arg43, %float9.999990e-13 : !torch.tensor, !torch.list<int>, !torch.tensor, !torch.tensor, !torch.float -> !torch.tensor, !torch.tensor, !torch.tensor | |
%21 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%result0_51, %result1_52, %result2_53 = torch.aten.native_layer_norm %arg264, %21, %arg46, %arg45, %float9.999990e-13 : !torch.tensor, !torch.list<int>, !torch.tensor, !torch.tensor, !torch.float -> !torch.tensor, !torch.tensor, !torch.tensor | |
%22 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%result0_54, %result1_55, %result2_56 = torch.aten.native_layer_norm %arg280, %22, %arg48, %arg47, %float9.999990e-13 : !torch.tensor, !torch.list<int>, !torch.tensor, !torch.tensor, !torch.float -> !torch.tensor, !torch.tensor, !torch.tensor | |
%23 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%result0_57, %result1_58, %result2_59 = torch.aten.native_layer_norm %arg287, %23, %arg50, %arg49, %float9.999990e-13 : !torch.tensor, !torch.list<int>, !torch.tensor, !torch.tensor, !torch.float -> !torch.tensor, !torch.tensor, !torch.tensor | |
%24 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%result0_60, %result1_61, %result2_62 = torch.aten.native_layer_norm %arg303, %24, %arg12, %arg11, %float9.999990e-13 : !torch.tensor, !torch.list<int>, !torch.tensor, !torch.tensor, !torch.float -> !torch.tensor, !torch.tensor, !torch.tensor | |
%25 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%result0_63, %result1_64, %result2_65 = torch.aten.native_layer_norm %arg310, %25, %arg14, %arg13, %float9.999990e-13 : !torch.tensor, !torch.list<int>, !torch.tensor, !torch.tensor, !torch.float -> !torch.tensor, !torch.tensor, !torch.tensor | |
%26 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%result0_66, %result1_67, %result2_68 = torch.aten.native_layer_norm %arg326, %26, %arg16, %arg15, %float9.999990e-13 : !torch.tensor, !torch.list<int>, !torch.tensor, !torch.tensor, !torch.float -> !torch.tensor, !torch.tensor, !torch.tensor | |
%27 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%result0_69, %result1_70, %result2_71 = torch.aten.native_layer_norm %arg333, %27, %arg18, %arg17, %float9.999990e-13 : !torch.tensor, !torch.list<int>, !torch.tensor, !torch.tensor, !torch.float -> !torch.tensor, !torch.tensor, !torch.tensor | |
%28 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%result0_72, %result1_73, %result2_74 = torch.aten.native_layer_norm %arg337, %28, %arg52, %arg51, %float9.999990e-13 : !torch.tensor, !torch.list<int>, !torch.tensor, !torch.tensor, !torch.float -> !torch.tensor, !torch.tensor, !torch.tensor | |
%output, %total_weight = torch.aten.nll_loss_forward %arg341, %arg340, %none, %int1, %int-100 : !torch.tensor, !torch.tensor, !torch.none, !torch.int, !torch.int -> !torch.tensor, !torch.tensor | |
%29 = torch.aten.nll_loss_backward %arg342, %arg341, %arg340, %none, %int1, %int-100, %total_weight : !torch.tensor, !torch.tensor, !torch.tensor, !torch.none, !torch.int, !torch.int, !torch.tensor -> !torch.tensor | |
%30 = torch.aten._log_softmax_backward_data %29, %arg341, %int1, %int6 : !torch.tensor, !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%31 = torch.prim.ListConstruct %int4, %int512, %int30522 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%32 = torch.aten.view %30, %31 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%non = torch.aten.view %30, %31 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%33 = torch.aten.add.Tensor %arg343, %32, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%34 = torch.prim.ListConstruct %int2048, %int30522 : (!torch.int, !torch.int) -> !torch.list<int> | |
%35 = torch.aten.view %33, %34 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%36 = torch.aten.t %arg338 : !torch.tensor -> !torch.tensor | |
%37 = torch.aten.mm %35, %36 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%38 = torch.aten.t %35 : !torch.tensor -> !torch.tensor | |
%39 = torch.aten.mm %38, %arg339 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%40 = torch.aten.t %39 : !torch.tensor -> !torch.tensor | |
%41 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%42 = torch.aten.sum.dim_IntList %35, %41, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%43 = torch.prim.ListConstruct %int30522 : (!torch.int) -> !torch.list<int> | |
%44 = torch.aten.view %42, %43 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%45 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%46 = torch.aten.view %37, %45 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%47 = torch.aten.t %40 : !torch.tensor -> !torch.tensor | |
%48 = torch.aten.sub.Tensor %arg337, %result1_73, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%49 = torch.aten.mul.Tensor %48, %result2_74 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%50 = torch.aten.mul.Tensor %46, %arg52 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%51 = torch.aten.mul.Tensor %50, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%52 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%53 = torch.aten.sum.dim_IntList %50, %52, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%54 = torch.aten.mul.Tensor %50, %49 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%55 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%56 = torch.aten.sum.dim_IntList %54, %55, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%57 = torch.aten.mul.Tensor %49, %56 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%58 = torch.aten.sub.Tensor %51, %53, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%59 = torch.aten.sub.Tensor %58, %57, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%60 = torch.aten.div.Tensor %result2_74, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%61 = torch.aten.mul.Tensor %60, %59 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%62 = torch.aten.mul.Tensor %46, %49 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%63 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%64 = torch.aten.sum.dim_IntList %62, %63, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%65 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%66 = torch.aten.sum.dim_IntList %46, %65, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%67 = torch.aten.gelu_backward %61, %arg336, %str : !torch.tensor, !torch.tensor, !torch.str -> !torch.tensor | |
%68 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%69 = torch.aten.view %67, %68 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%70 = torch.aten.t %arg334 : !torch.tensor -> !torch.tensor | |
%71 = torch.aten.mm %69, %70 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%72 = torch.aten.t %69 : !torch.tensor -> !torch.tensor | |
%73 = torch.aten.mm %72, %arg335 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%74 = torch.aten.t %73 : !torch.tensor -> !torch.tensor | |
%75 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%76 = torch.aten.sum.dim_IntList %69, %75, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%77 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%78 = torch.aten.view %76, %77 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%79 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%80 = torch.aten.view %71, %79 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%81 = torch.aten.t %74 : !torch.tensor -> !torch.tensor | |
%82 = torch.aten.sub.Tensor %arg333, %result1_70, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%83 = torch.aten.mul.Tensor %82, %result2_71 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%84 = torch.aten.mul.Tensor %80, %arg18 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%85 = torch.aten.mul.Tensor %84, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%86 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%87 = torch.aten.sum.dim_IntList %84, %86, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%88 = torch.aten.mul.Tensor %84, %83 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%89 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%90 = torch.aten.sum.dim_IntList %88, %89, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%91 = torch.aten.mul.Tensor %83, %90 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%92 = torch.aten.sub.Tensor %85, %87, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%93 = torch.aten.sub.Tensor %92, %91, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%94 = torch.aten.div.Tensor %result2_71, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%95 = torch.aten.mul.Tensor %94, %93 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%96 = torch.aten.mul.Tensor %80, %83 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%97 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%98 = torch.aten.sum.dim_IntList %96, %97, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%99 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%100 = torch.aten.sum.dim_IntList %80, %99, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%101 = torch.aten.mul.Tensor %95, %arg332 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%102 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%103 = torch.aten.view %101, %102 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%104 = torch.aten.t %arg330 : !torch.tensor -> !torch.tensor | |
%105 = torch.aten.mm %103, %104 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%106 = torch.aten.t %103 : !torch.tensor -> !torch.tensor | |
%107 = torch.aten.mm %106, %arg331 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%108 = torch.aten.t %107 : !torch.tensor -> !torch.tensor | |
%109 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%110 = torch.aten.sum.dim_IntList %103, %109, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%111 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%112 = torch.aten.view %110, %111 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%113 = torch.prim.ListConstruct %int4, %int512, %int3072 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%114 = torch.aten.view %105, %113 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%115 = torch.aten.t %108 : !torch.tensor -> !torch.tensor | |
%116 = torch.aten.gelu_backward %114, %arg329, %str : !torch.tensor, !torch.tensor, !torch.str -> !torch.tensor | |
%117 = torch.prim.ListConstruct %int2048, %int3072 : (!torch.int, !torch.int) -> !torch.list<int> | |
%118 = torch.aten.view %116, %117 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%119 = torch.aten.t %arg327 : !torch.tensor -> !torch.tensor | |
%120 = torch.aten.mm %118, %119 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%121 = torch.aten.t %118 : !torch.tensor -> !torch.tensor | |
%122 = torch.aten.mm %121, %arg328 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%123 = torch.aten.t %122 : !torch.tensor -> !torch.tensor | |
%124 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%125 = torch.aten.sum.dim_IntList %118, %124, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%126 = torch.prim.ListConstruct %int3072 : (!torch.int) -> !torch.list<int> | |
%127 = torch.aten.view %125, %126 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%128 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%129 = torch.aten.view %120, %128 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%130 = torch.aten.add.Tensor %95, %129, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%131 = torch.aten.t %123 : !torch.tensor -> !torch.tensor | |
%132 = torch.aten.sub.Tensor %arg326, %result1_67, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%133 = torch.aten.mul.Tensor %132, %result2_68 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%134 = torch.aten.mul.Tensor %130, %arg16 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%135 = torch.aten.mul.Tensor %134, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%136 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%137 = torch.aten.sum.dim_IntList %134, %136, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%138 = torch.aten.mul.Tensor %134, %133 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%139 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%140 = torch.aten.sum.dim_IntList %138, %139, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%141 = torch.aten.mul.Tensor %133, %140 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%142 = torch.aten.sub.Tensor %135, %137, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%143 = torch.aten.sub.Tensor %142, %141, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%144 = torch.aten.div.Tensor %result2_68, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%145 = torch.aten.mul.Tensor %144, %143 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%146 = torch.aten.mul.Tensor %130, %133 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%147 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%148 = torch.aten.sum.dim_IntList %146, %147, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%149 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%150 = torch.aten.sum.dim_IntList %130, %149, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%151 = torch.aten.mul.Tensor %145, %arg325 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%152 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%153 = torch.aten.view %151, %152 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%154 = torch.aten.t %arg323 : !torch.tensor -> !torch.tensor | |
%155 = torch.aten.mm %153, %154 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%156 = torch.aten.t %153 : !torch.tensor -> !torch.tensor | |
%157 = torch.aten.mm %156, %arg324 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%158 = torch.aten.t %157 : !torch.tensor -> !torch.tensor | |
%159 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%160 = torch.aten.sum.dim_IntList %153, %159, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%161 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%162 = torch.aten.view %160, %161 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%163 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%164 = torch.aten.view %155, %163 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%165 = torch.aten.t %158 : !torch.tensor -> !torch.tensor | |
%166 = torch.prim.ListConstruct %int4, %int512, %int12, %int64 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%167 = torch.aten.view %164, %166 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%168 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%169 = torch.aten.permute %167, %168 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%170 = torch.aten.clone %169, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%171 = torch.prim.ListConstruct %int48, %int512, %int64 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%172 = torch.aten._unsafe_view %170, %171 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%173 = torch.aten.transpose.int %arg321, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%174 = torch.aten.bmm %173, %172 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%175 = torch.aten.transpose.int %arg322, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%176 = torch.aten.bmm %172, %175 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%177 = torch.prim.ListConstruct %int4, %int12, %int512, %int64 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%178 = torch.aten.view %174, %177 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%179 = torch.prim.ListConstruct %int4, %int12, %int512, %int512 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%180 = torch.aten.view %176, %179 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%181 = torch.aten.mul.Tensor %180, %arg320 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%182 = torch.aten._softmax_backward_data %181, %arg319, %int-1, %int6 : !torch.tensor, !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%183 = torch.aten.div.Tensor %182, %1 : !torch.tensor, !torch.tensor<[],f64> -> !torch.tensor | |
%184 = torch.prim.ListConstruct %int48, %int512, %int512 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%185 = torch.aten.view %183, %184 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%186 = torch.aten.transpose.int %arg317, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%187 = torch.aten.bmm %186, %185 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%188 = torch.aten.transpose.int %arg318, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%189 = torch.aten.bmm %185, %188 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%190 = torch.prim.ListConstruct %int4, %int12, %int64, %int512 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%191 = torch.aten.view %187, %190 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%192 = torch.prim.ListConstruct %int4, %int12, %int512, %int64 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%193 = torch.aten.view %189, %192 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%194 = torch.aten.transpose.int %191, %int-1, %int-2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%195 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%196 = torch.aten.permute %193, %195 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%197 = torch.aten.clone %196, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%198 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%199 = torch.aten._unsafe_view %197, %198 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%200 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%201 = torch.aten.permute %178, %200 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%202 = torch.aten.clone %201, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%203 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%204 = torch.aten._unsafe_view %202, %203 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%205 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%206 = torch.aten.view %204, %205 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%207 = torch.aten.t %arg315 : !torch.tensor -> !torch.tensor | |
%208 = torch.aten.mm %206, %207 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%209 = torch.aten.t %206 : !torch.tensor -> !torch.tensor | |
%210 = torch.aten.mm %209, %arg316 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%211 = torch.aten.t %210 : !torch.tensor -> !torch.tensor | |
%212 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%213 = torch.aten.sum.dim_IntList %206, %212, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%214 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%215 = torch.aten.view %213, %214 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%216 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%217 = torch.aten.view %208, %216 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%218 = torch.aten.add.Tensor %145, %217, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%219 = torch.aten.t %211 : !torch.tensor -> !torch.tensor | |
%220 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%221 = torch.aten.permute %194, %220 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%222 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%223 = torch.aten.view %221, %222 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%224 = torch.aten.clone %223, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%225 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%226 = torch.aten._unsafe_view %224, %225 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%227 = torch.aten.t %arg313 : !torch.tensor -> !torch.tensor | |
%228 = torch.aten.mm %226, %227 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%229 = torch.aten.t %226 : !torch.tensor -> !torch.tensor | |
%230 = torch.aten.mm %229, %arg314 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%231 = torch.aten.t %230 : !torch.tensor -> !torch.tensor | |
%232 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%233 = torch.aten.sum.dim_IntList %226, %232, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%234 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%235 = torch.aten.view %233, %234 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%236 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%237 = torch.aten.view %228, %236 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%238 = torch.aten.add.Tensor %218, %237, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%239 = torch.aten.t %231 : !torch.tensor -> !torch.tensor | |
%240 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%241 = torch.aten.view %199, %240 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%242 = torch.aten.t %arg311 : !torch.tensor -> !torch.tensor | |
%243 = torch.aten.mm %241, %242 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%244 = torch.aten.t %241 : !torch.tensor -> !torch.tensor | |
%245 = torch.aten.mm %244, %arg312 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%246 = torch.aten.t %245 : !torch.tensor -> !torch.tensor | |
%247 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%248 = torch.aten.sum.dim_IntList %241, %247, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%249 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%250 = torch.aten.view %248, %249 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%251 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%252 = torch.aten.view %243, %251 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%253 = torch.aten.add.Tensor %238, %252, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%254 = torch.aten.t %246 : !torch.tensor -> !torch.tensor | |
%255 = torch.aten.sub.Tensor %arg310, %result1_64, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%256 = torch.aten.mul.Tensor %255, %result2_65 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%257 = torch.aten.mul.Tensor %253, %arg14 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%258 = torch.aten.mul.Tensor %257, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%259 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%260 = torch.aten.sum.dim_IntList %257, %259, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%261 = torch.aten.mul.Tensor %257, %256 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%262 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%263 = torch.aten.sum.dim_IntList %261, %262, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%264 = torch.aten.mul.Tensor %256, %263 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%265 = torch.aten.sub.Tensor %258, %260, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%266 = torch.aten.sub.Tensor %265, %264, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%267 = torch.aten.div.Tensor %result2_65, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%268 = torch.aten.mul.Tensor %267, %266 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%269 = torch.aten.mul.Tensor %253, %256 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%270 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%271 = torch.aten.sum.dim_IntList %269, %270, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%272 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%273 = torch.aten.sum.dim_IntList %253, %272, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%274 = torch.aten.mul.Tensor %268, %arg309 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%275 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%276 = torch.aten.view %274, %275 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%277 = torch.aten.t %arg307 : !torch.tensor -> !torch.tensor | |
%278 = torch.aten.mm %276, %277 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%279 = torch.aten.t %276 : !torch.tensor -> !torch.tensor | |
%280 = torch.aten.mm %279, %arg308 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%281 = torch.aten.t %280 : !torch.tensor -> !torch.tensor | |
%282 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%283 = torch.aten.sum.dim_IntList %276, %282, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%284 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%285 = torch.aten.view %283, %284 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%286 = torch.prim.ListConstruct %int4, %int512, %int3072 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%287 = torch.aten.view %278, %286 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%288 = torch.aten.t %281 : !torch.tensor -> !torch.tensor | |
%289 = torch.aten.gelu_backward %287, %arg306, %str : !torch.tensor, !torch.tensor, !torch.str -> !torch.tensor | |
%290 = torch.prim.ListConstruct %int2048, %int3072 : (!torch.int, !torch.int) -> !torch.list<int> | |
%291 = torch.aten.view %289, %290 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%292 = torch.aten.t %arg304 : !torch.tensor -> !torch.tensor | |
%293 = torch.aten.mm %291, %292 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%294 = torch.aten.t %291 : !torch.tensor -> !torch.tensor | |
%295 = torch.aten.mm %294, %arg305 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%296 = torch.aten.t %295 : !torch.tensor -> !torch.tensor | |
%297 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%298 = torch.aten.sum.dim_IntList %291, %297, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%299 = torch.prim.ListConstruct %int3072 : (!torch.int) -> !torch.list<int> | |
%300 = torch.aten.view %298, %299 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%301 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%302 = torch.aten.view %293, %301 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%303 = torch.aten.add.Tensor %268, %302, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%304 = torch.aten.t %296 : !torch.tensor -> !torch.tensor | |
%305 = torch.aten.sub.Tensor %arg303, %result1_61, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%306 = torch.aten.mul.Tensor %305, %result2_62 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%307 = torch.aten.mul.Tensor %303, %arg12 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%308 = torch.aten.mul.Tensor %307, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%309 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%310 = torch.aten.sum.dim_IntList %307, %309, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%311 = torch.aten.mul.Tensor %307, %306 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%312 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%313 = torch.aten.sum.dim_IntList %311, %312, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%314 = torch.aten.mul.Tensor %306, %313 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%315 = torch.aten.sub.Tensor %308, %310, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%316 = torch.aten.sub.Tensor %315, %314, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%317 = torch.aten.div.Tensor %result2_62, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%318 = torch.aten.mul.Tensor %317, %316 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%319 = torch.aten.mul.Tensor %303, %306 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%320 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%321 = torch.aten.sum.dim_IntList %319, %320, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%322 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%323 = torch.aten.sum.dim_IntList %303, %322, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%324 = torch.aten.mul.Tensor %318, %arg302 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%325 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%326 = torch.aten.view %324, %325 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%327 = torch.aten.t %arg300 : !torch.tensor -> !torch.tensor | |
%328 = torch.aten.mm %326, %327 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%329 = torch.aten.t %326 : !torch.tensor -> !torch.tensor | |
%330 = torch.aten.mm %329, %arg301 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%331 = torch.aten.t %330 : !torch.tensor -> !torch.tensor | |
%332 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%333 = torch.aten.sum.dim_IntList %326, %332, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%334 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%335 = torch.aten.view %333, %334 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%336 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%337 = torch.aten.view %328, %336 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%338 = torch.aten.t %331 : !torch.tensor -> !torch.tensor | |
%339 = torch.prim.ListConstruct %int4, %int512, %int12, %int64 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%340 = torch.aten.view %337, %339 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%341 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%342 = torch.aten.permute %340, %341 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%343 = torch.aten.clone %342, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%344 = torch.prim.ListConstruct %int48, %int512, %int64 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%345 = torch.aten._unsafe_view %343, %344 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%346 = torch.aten.transpose.int %arg298, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%347 = torch.aten.bmm %346, %345 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%348 = torch.aten.transpose.int %arg299, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%349 = torch.aten.bmm %345, %348 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%350 = torch.prim.ListConstruct %int4, %int12, %int512, %int64 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%351 = torch.aten.view %347, %350 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%352 = torch.prim.ListConstruct %int4, %int12, %int512, %int512 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%353 = torch.aten.view %349, %352 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%354 = torch.aten.mul.Tensor %353, %arg297 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%355 = torch.aten._softmax_backward_data %354, %arg296, %int-1, %int6 : !torch.tensor, !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%356 = torch.aten.div.Tensor %355, %1 : !torch.tensor, !torch.tensor<[],f64> -> !torch.tensor | |
%357 = torch.prim.ListConstruct %int48, %int512, %int512 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%358 = torch.aten.view %356, %357 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%359 = torch.aten.transpose.int %arg294, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%360 = torch.aten.bmm %359, %358 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%361 = torch.aten.transpose.int %arg295, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%362 = torch.aten.bmm %358, %361 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%363 = torch.prim.ListConstruct %int4, %int12, %int64, %int512 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%364 = torch.aten.view %360, %363 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%365 = torch.prim.ListConstruct %int4, %int12, %int512, %int64 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%366 = torch.aten.view %362, %365 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%367 = torch.aten.transpose.int %364, %int-1, %int-2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%368 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%369 = torch.aten.permute %366, %368 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%370 = torch.aten.clone %369, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%371 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%372 = torch.aten._unsafe_view %370, %371 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%373 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%374 = torch.aten.permute %351, %373 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%375 = torch.aten.clone %374, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%376 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%377 = torch.aten._unsafe_view %375, %376 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%378 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%379 = torch.aten.view %377, %378 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%380 = torch.aten.t %arg292 : !torch.tensor -> !torch.tensor | |
%381 = torch.aten.mm %379, %380 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%382 = torch.aten.t %379 : !torch.tensor -> !torch.tensor | |
%383 = torch.aten.mm %382, %arg293 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%384 = torch.aten.t %383 : !torch.tensor -> !torch.tensor | |
%385 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%386 = torch.aten.sum.dim_IntList %379, %385, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%387 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%388 = torch.aten.view %386, %387 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%389 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%390 = torch.aten.view %381, %389 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%391 = torch.aten.add.Tensor %318, %390, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%392 = torch.aten.t %384 : !torch.tensor -> !torch.tensor | |
%393 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%394 = torch.aten.permute %367, %393 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%395 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%396 = torch.aten.view %394, %395 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%397 = torch.aten.clone %396, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%398 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%399 = torch.aten._unsafe_view %397, %398 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%400 = torch.aten.t %arg290 : !torch.tensor -> !torch.tensor | |
%401 = torch.aten.mm %399, %400 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%402 = torch.aten.t %399 : !torch.tensor -> !torch.tensor | |
%403 = torch.aten.mm %402, %arg291 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%404 = torch.aten.t %403 : !torch.tensor -> !torch.tensor | |
%405 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%406 = torch.aten.sum.dim_IntList %399, %405, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%407 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%408 = torch.aten.view %406, %407 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%409 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%410 = torch.aten.view %401, %409 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%411 = torch.aten.add.Tensor %391, %410, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%412 = torch.aten.t %404 : !torch.tensor -> !torch.tensor | |
%413 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%414 = torch.aten.view %372, %413 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%415 = torch.aten.t %arg288 : !torch.tensor -> !torch.tensor | |
%416 = torch.aten.mm %414, %415 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%417 = torch.aten.t %414 : !torch.tensor -> !torch.tensor | |
%418 = torch.aten.mm %417, %arg289 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%419 = torch.aten.t %418 : !torch.tensor -> !torch.tensor | |
%420 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%421 = torch.aten.sum.dim_IntList %414, %420, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%422 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%423 = torch.aten.view %421, %422 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%424 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%425 = torch.aten.view %416, %424 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%426 = torch.aten.add.Tensor %411, %425, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%427 = torch.aten.t %419 : !torch.tensor -> !torch.tensor | |
%428 = torch.aten.sub.Tensor %arg287, %result1_58, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%429 = torch.aten.mul.Tensor %428, %result2_59 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%430 = torch.aten.mul.Tensor %426, %arg50 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%431 = torch.aten.mul.Tensor %430, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%432 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%433 = torch.aten.sum.dim_IntList %430, %432, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%434 = torch.aten.mul.Tensor %430, %429 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%435 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%436 = torch.aten.sum.dim_IntList %434, %435, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%437 = torch.aten.mul.Tensor %429, %436 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%438 = torch.aten.sub.Tensor %431, %433, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%439 = torch.aten.sub.Tensor %438, %437, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%440 = torch.aten.div.Tensor %result2_59, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%441 = torch.aten.mul.Tensor %440, %439 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%442 = torch.aten.mul.Tensor %426, %429 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%443 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%444 = torch.aten.sum.dim_IntList %442, %443, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%445 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%446 = torch.aten.sum.dim_IntList %426, %445, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%447 = torch.aten.mul.Tensor %441, %arg286 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%448 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%449 = torch.aten.view %447, %448 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%450 = torch.aten.t %arg284 : !torch.tensor -> !torch.tensor | |
%451 = torch.aten.mm %449, %450 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%452 = torch.aten.t %449 : !torch.tensor -> !torch.tensor | |
%453 = torch.aten.mm %452, %arg285 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%454 = torch.aten.t %453 : !torch.tensor -> !torch.tensor | |
%455 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%456 = torch.aten.sum.dim_IntList %449, %455, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%457 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%458 = torch.aten.view %456, %457 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%459 = torch.prim.ListConstruct %int4, %int512, %int3072 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%460 = torch.aten.view %451, %459 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%461 = torch.aten.t %454 : !torch.tensor -> !torch.tensor | |
%462 = torch.aten.gelu_backward %460, %arg283, %str : !torch.tensor, !torch.tensor, !torch.str -> !torch.tensor | |
%463 = torch.prim.ListConstruct %int2048, %int3072 : (!torch.int, !torch.int) -> !torch.list<int> | |
%464 = torch.aten.view %462, %463 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%465 = torch.aten.t %arg281 : !torch.tensor -> !torch.tensor | |
%466 = torch.aten.mm %464, %465 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%467 = torch.aten.t %464 : !torch.tensor -> !torch.tensor | |
%468 = torch.aten.mm %467, %arg282 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%469 = torch.aten.t %468 : !torch.tensor -> !torch.tensor | |
%470 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%471 = torch.aten.sum.dim_IntList %464, %470, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%472 = torch.prim.ListConstruct %int3072 : (!torch.int) -> !torch.list<int> | |
%473 = torch.aten.view %471, %472 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%474 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%475 = torch.aten.view %466, %474 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%476 = torch.aten.add.Tensor %441, %475, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%477 = torch.aten.t %469 : !torch.tensor -> !torch.tensor | |
%478 = torch.aten.sub.Tensor %arg280, %result1_55, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%479 = torch.aten.mul.Tensor %478, %result2_56 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%480 = torch.aten.mul.Tensor %476, %arg48 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%481 = torch.aten.mul.Tensor %480, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%482 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%483 = torch.aten.sum.dim_IntList %480, %482, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%484 = torch.aten.mul.Tensor %480, %479 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%485 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%486 = torch.aten.sum.dim_IntList %484, %485, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%487 = torch.aten.mul.Tensor %479, %486 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%488 = torch.aten.sub.Tensor %481, %483, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%489 = torch.aten.sub.Tensor %488, %487, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%490 = torch.aten.div.Tensor %result2_56, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%491 = torch.aten.mul.Tensor %490, %489 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%492 = torch.aten.mul.Tensor %476, %479 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%493 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%494 = torch.aten.sum.dim_IntList %492, %493, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%495 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%496 = torch.aten.sum.dim_IntList %476, %495, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%497 = torch.aten.mul.Tensor %491, %arg279 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%498 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%499 = torch.aten.view %497, %498 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%500 = torch.aten.t %arg277 : !torch.tensor -> !torch.tensor | |
%501 = torch.aten.mm %499, %500 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%502 = torch.aten.t %499 : !torch.tensor -> !torch.tensor | |
%503 = torch.aten.mm %502, %arg278 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%504 = torch.aten.t %503 : !torch.tensor -> !torch.tensor | |
%505 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%506 = torch.aten.sum.dim_IntList %499, %505, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%507 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%508 = torch.aten.view %506, %507 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%509 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%510 = torch.aten.view %501, %509 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%511 = torch.aten.t %504 : !torch.tensor -> !torch.tensor | |
%512 = torch.prim.ListConstruct %int4, %int512, %int12, %int64 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%513 = torch.aten.view %510, %512 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%514 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%515 = torch.aten.permute %513, %514 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%516 = torch.aten.clone %515, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%517 = torch.prim.ListConstruct %int48, %int512, %int64 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%518 = torch.aten._unsafe_view %516, %517 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%519 = torch.aten.transpose.int %arg275, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%520 = torch.aten.bmm %519, %518 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%521 = torch.aten.transpose.int %arg276, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%522 = torch.aten.bmm %518, %521 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%523 = torch.prim.ListConstruct %int4, %int12, %int512, %int64 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%524 = torch.aten.view %520, %523 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%525 = torch.prim.ListConstruct %int4, %int12, %int512, %int512 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%526 = torch.aten.view %522, %525 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%527 = torch.aten.mul.Tensor %526, %arg274 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%528 = torch.aten._softmax_backward_data %527, %arg273, %int-1, %int6 : !torch.tensor, !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%529 = torch.aten.div.Tensor %528, %1 : !torch.tensor, !torch.tensor<[],f64> -> !torch.tensor | |
%530 = torch.prim.ListConstruct %int48, %int512, %int512 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%531 = torch.aten.view %529, %530 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%532 = torch.aten.transpose.int %arg271, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%533 = torch.aten.bmm %532, %531 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%534 = torch.aten.transpose.int %arg272, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%535 = torch.aten.bmm %531, %534 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%536 = torch.prim.ListConstruct %int4, %int12, %int64, %int512 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%537 = torch.aten.view %533, %536 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%538 = torch.prim.ListConstruct %int4, %int12, %int512, %int64 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%539 = torch.aten.view %535, %538 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%540 = torch.aten.transpose.int %537, %int-1, %int-2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%541 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%542 = torch.aten.permute %539, %541 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%543 = torch.aten.clone %542, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%544 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%545 = torch.aten._unsafe_view %543, %544 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%546 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%547 = torch.aten.permute %524, %546 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%548 = torch.aten.clone %547, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%549 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%550 = torch.aten._unsafe_view %548, %549 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%551 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%552 = torch.aten.view %550, %551 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%553 = torch.aten.t %arg269 : !torch.tensor -> !torch.tensor | |
%554 = torch.aten.mm %552, %553 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%555 = torch.aten.t %552 : !torch.tensor -> !torch.tensor | |
%556 = torch.aten.mm %555, %arg270 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%557 = torch.aten.t %556 : !torch.tensor -> !torch.tensor | |
%558 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%559 = torch.aten.sum.dim_IntList %552, %558, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%560 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%561 = torch.aten.view %559, %560 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%562 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%563 = torch.aten.view %554, %562 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%564 = torch.aten.add.Tensor %491, %563, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%565 = torch.aten.t %557 : !torch.tensor -> !torch.tensor | |
%566 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%567 = torch.aten.permute %540, %566 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%568 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%569 = torch.aten.view %567, %568 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%570 = torch.aten.clone %569, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%571 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%572 = torch.aten._unsafe_view %570, %571 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%573 = torch.aten.t %arg267 : !torch.tensor -> !torch.tensor | |
%574 = torch.aten.mm %572, %573 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%575 = torch.aten.t %572 : !torch.tensor -> !torch.tensor | |
%576 = torch.aten.mm %575, %arg268 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%577 = torch.aten.t %576 : !torch.tensor -> !torch.tensor | |
%578 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%579 = torch.aten.sum.dim_IntList %572, %578, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%580 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%581 = torch.aten.view %579, %580 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%582 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%583 = torch.aten.view %574, %582 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%584 = torch.aten.add.Tensor %564, %583, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%585 = torch.aten.t %577 : !torch.tensor -> !torch.tensor | |
%586 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%587 = torch.aten.view %545, %586 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%588 = torch.aten.t %arg265 : !torch.tensor -> !torch.tensor | |
%589 = torch.aten.mm %587, %588 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%590 = torch.aten.t %587 : !torch.tensor -> !torch.tensor | |
%591 = torch.aten.mm %590, %arg266 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%592 = torch.aten.t %591 : !torch.tensor -> !torch.tensor | |
%593 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%594 = torch.aten.sum.dim_IntList %587, %593, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%595 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%596 = torch.aten.view %594, %595 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%597 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%598 = torch.aten.view %589, %597 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%599 = torch.aten.add.Tensor %584, %598, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%600 = torch.aten.t %592 : !torch.tensor -> !torch.tensor | |
%601 = torch.aten.sub.Tensor %arg264, %result1_52, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%602 = torch.aten.mul.Tensor %601, %result2_53 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%603 = torch.aten.mul.Tensor %599, %arg46 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%604 = torch.aten.mul.Tensor %603, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%605 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%606 = torch.aten.sum.dim_IntList %603, %605, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%607 = torch.aten.mul.Tensor %603, %602 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%608 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%609 = torch.aten.sum.dim_IntList %607, %608, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%610 = torch.aten.mul.Tensor %602, %609 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%611 = torch.aten.sub.Tensor %604, %606, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%612 = torch.aten.sub.Tensor %611, %610, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%613 = torch.aten.div.Tensor %result2_53, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%614 = torch.aten.mul.Tensor %613, %612 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%615 = torch.aten.mul.Tensor %599, %602 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%616 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%617 = torch.aten.sum.dim_IntList %615, %616, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%618 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%619 = torch.aten.sum.dim_IntList %599, %618, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%620 = torch.aten.mul.Tensor %614, %arg263 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%621 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%622 = torch.aten.view %620, %621 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%623 = torch.aten.t %arg261 : !torch.tensor -> !torch.tensor | |
%624 = torch.aten.mm %622, %623 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%625 = torch.aten.t %622 : !torch.tensor -> !torch.tensor | |
%626 = torch.aten.mm %625, %arg262 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%627 = torch.aten.t %626 : !torch.tensor -> !torch.tensor | |
%628 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%629 = torch.aten.sum.dim_IntList %622, %628, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%630 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%631 = torch.aten.view %629, %630 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%632 = torch.prim.ListConstruct %int4, %int512, %int3072 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%633 = torch.aten.view %624, %632 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%634 = torch.aten.t %627 : !torch.tensor -> !torch.tensor | |
%635 = torch.aten.gelu_backward %633, %arg260, %str : !torch.tensor, !torch.tensor, !torch.str -> !torch.tensor | |
%636 = torch.prim.ListConstruct %int2048, %int3072 : (!torch.int, !torch.int) -> !torch.list<int> | |
%637 = torch.aten.view %635, %636 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%638 = torch.aten.t %arg258 : !torch.tensor -> !torch.tensor | |
%639 = torch.aten.mm %637, %638 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%640 = torch.aten.t %637 : !torch.tensor -> !torch.tensor | |
%641 = torch.aten.mm %640, %arg259 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%642 = torch.aten.t %641 : !torch.tensor -> !torch.tensor | |
%643 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%644 = torch.aten.sum.dim_IntList %637, %643, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%645 = torch.prim.ListConstruct %int3072 : (!torch.int) -> !torch.list<int> | |
%646 = torch.aten.view %644, %645 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%647 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%648 = torch.aten.view %639, %647 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%649 = torch.aten.add.Tensor %614, %648, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%650 = torch.aten.t %642 : !torch.tensor -> !torch.tensor | |
%651 = torch.aten.sub.Tensor %arg257, %result1_49, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%652 = torch.aten.mul.Tensor %651, %result2_50 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%653 = torch.aten.mul.Tensor %649, %arg44 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%654 = torch.aten.mul.Tensor %653, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%655 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%656 = torch.aten.sum.dim_IntList %653, %655, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%657 = torch.aten.mul.Tensor %653, %652 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%658 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%659 = torch.aten.sum.dim_IntList %657, %658, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%660 = torch.aten.mul.Tensor %652, %659 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%661 = torch.aten.sub.Tensor %654, %656, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%662 = torch.aten.sub.Tensor %661, %660, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%663 = torch.aten.div.Tensor %result2_50, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%664 = torch.aten.mul.Tensor %663, %662 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%665 = torch.aten.mul.Tensor %649, %652 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%666 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%667 = torch.aten.sum.dim_IntList %665, %666, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%668 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%669 = torch.aten.sum.dim_IntList %649, %668, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%670 = torch.aten.mul.Tensor %664, %arg256 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%671 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%672 = torch.aten.view %670, %671 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%673 = torch.aten.t %arg254 : !torch.tensor -> !torch.tensor | |
%674 = torch.aten.mm %672, %673 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%675 = torch.aten.t %672 : !torch.tensor -> !torch.tensor | |
%676 = torch.aten.mm %675, %arg255 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%677 = torch.aten.t %676 : !torch.tensor -> !torch.tensor | |
%678 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%679 = torch.aten.sum.dim_IntList %672, %678, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%680 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%681 = torch.aten.view %679, %680 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%682 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%683 = torch.aten.view %674, %682 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%684 = torch.aten.t %677 : !torch.tensor -> !torch.tensor | |
%685 = torch.prim.ListConstruct %int4, %int512, %int12, %int64 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%686 = torch.aten.view %683, %685 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%687 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%688 = torch.aten.permute %686, %687 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%689 = torch.aten.clone %688, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%690 = torch.prim.ListConstruct %int48, %int512, %int64 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%691 = torch.aten._unsafe_view %689, %690 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%692 = torch.aten.transpose.int %arg252, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%693 = torch.aten.bmm %692, %691 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%694 = torch.aten.transpose.int %arg253, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%695 = torch.aten.bmm %691, %694 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%696 = torch.prim.ListConstruct %int4, %int12, %int512, %int64 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%697 = torch.aten.view %693, %696 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%698 = torch.prim.ListConstruct %int4, %int12, %int512, %int512 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%699 = torch.aten.view %695, %698 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%700 = torch.aten.mul.Tensor %699, %arg251 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%701 = torch.aten._softmax_backward_data %700, %arg250, %int-1, %int6 : !torch.tensor, !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%702 = torch.aten.div.Tensor %701, %1 : !torch.tensor, !torch.tensor<[],f64> -> !torch.tensor | |
%703 = torch.prim.ListConstruct %int48, %int512, %int512 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%704 = torch.aten.view %702, %703 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%705 = torch.aten.transpose.int %arg248, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%706 = torch.aten.bmm %705, %704 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%707 = torch.aten.transpose.int %arg249, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%708 = torch.aten.bmm %704, %707 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%709 = torch.prim.ListConstruct %int4, %int12, %int64, %int512 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%710 = torch.aten.view %706, %709 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%711 = torch.prim.ListConstruct %int4, %int12, %int512, %int64 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%712 = torch.aten.view %708, %711 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%713 = torch.aten.transpose.int %710, %int-1, %int-2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%714 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%715 = torch.aten.permute %712, %714 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%716 = torch.aten.clone %715, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%717 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%718 = torch.aten._unsafe_view %716, %717 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%719 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%720 = torch.aten.permute %697, %719 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%721 = torch.aten.clone %720, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%722 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%723 = torch.aten._unsafe_view %721, %722 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%724 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%725 = torch.aten.view %723, %724 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%726 = torch.aten.t %arg246 : !torch.tensor -> !torch.tensor | |
%727 = torch.aten.mm %725, %726 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%728 = torch.aten.t %725 : !torch.tensor -> !torch.tensor | |
%729 = torch.aten.mm %728, %arg247 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%730 = torch.aten.t %729 : !torch.tensor -> !torch.tensor | |
%731 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%732 = torch.aten.sum.dim_IntList %725, %731, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%733 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%734 = torch.aten.view %732, %733 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%735 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%736 = torch.aten.view %727, %735 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%737 = torch.aten.add.Tensor %664, %736, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%738 = torch.aten.t %730 : !torch.tensor -> !torch.tensor | |
%739 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%740 = torch.aten.permute %713, %739 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%741 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%742 = torch.aten.view %740, %741 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%743 = torch.aten.clone %742, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%744 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%745 = torch.aten._unsafe_view %743, %744 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%746 = torch.aten.t %arg244 : !torch.tensor -> !torch.tensor | |
%747 = torch.aten.mm %745, %746 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%748 = torch.aten.t %745 : !torch.tensor -> !torch.tensor | |
%749 = torch.aten.mm %748, %arg245 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%750 = torch.aten.t %749 : !torch.tensor -> !torch.tensor | |
%751 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%752 = torch.aten.sum.dim_IntList %745, %751, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%753 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%754 = torch.aten.view %752, %753 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%755 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%756 = torch.aten.view %747, %755 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%757 = torch.aten.add.Tensor %737, %756, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%758 = torch.aten.t %750 : !torch.tensor -> !torch.tensor | |
%759 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%760 = torch.aten.view %718, %759 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%761 = torch.aten.t %arg242 : !torch.tensor -> !torch.tensor | |
%762 = torch.aten.mm %760, %761 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%763 = torch.aten.t %760 : !torch.tensor -> !torch.tensor | |
%764 = torch.aten.mm %763, %arg243 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%765 = torch.aten.t %764 : !torch.tensor -> !torch.tensor | |
%766 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%767 = torch.aten.sum.dim_IntList %760, %766, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%768 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%769 = torch.aten.view %767, %768 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%770 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%771 = torch.aten.view %762, %770 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%772 = torch.aten.add.Tensor %757, %771, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%773 = torch.aten.t %765 : !torch.tensor -> !torch.tensor | |
%774 = torch.aten.sub.Tensor %arg241, %result1_46, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%775 = torch.aten.mul.Tensor %774, %result2_47 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%776 = torch.aten.mul.Tensor %772, %arg42 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%777 = torch.aten.mul.Tensor %776, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%778 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%779 = torch.aten.sum.dim_IntList %776, %778, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%780 = torch.aten.mul.Tensor %776, %775 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%781 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%782 = torch.aten.sum.dim_IntList %780, %781, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%783 = torch.aten.mul.Tensor %775, %782 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%784 = torch.aten.sub.Tensor %777, %779, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%785 = torch.aten.sub.Tensor %784, %783, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%786 = torch.aten.div.Tensor %result2_47, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%787 = torch.aten.mul.Tensor %786, %785 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%788 = torch.aten.mul.Tensor %772, %775 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%789 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%790 = torch.aten.sum.dim_IntList %788, %789, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%791 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%792 = torch.aten.sum.dim_IntList %772, %791, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%793 = torch.aten.mul.Tensor %787, %arg240 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%794 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%795 = torch.aten.view %793, %794 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%796 = torch.aten.t %arg238 : !torch.tensor -> !torch.tensor | |
%797 = torch.aten.mm %795, %796 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%798 = torch.aten.t %795 : !torch.tensor -> !torch.tensor | |
%799 = torch.aten.mm %798, %arg239 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%800 = torch.aten.t %799 : !torch.tensor -> !torch.tensor | |
%801 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%802 = torch.aten.sum.dim_IntList %795, %801, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%803 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%804 = torch.aten.view %802, %803 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%805 = torch.prim.ListConstruct %int4, %int512, %int3072 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%806 = torch.aten.view %797, %805 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%807 = torch.aten.t %800 : !torch.tensor -> !torch.tensor | |
%808 = torch.aten.gelu_backward %806, %arg237, %str : !torch.tensor, !torch.tensor, !torch.str -> !torch.tensor | |
%809 = torch.prim.ListConstruct %int2048, %int3072 : (!torch.int, !torch.int) -> !torch.list<int> | |
%810 = torch.aten.view %808, %809 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%811 = torch.aten.t %arg235 : !torch.tensor -> !torch.tensor | |
%812 = torch.aten.mm %810, %811 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%813 = torch.aten.t %810 : !torch.tensor -> !torch.tensor | |
%814 = torch.aten.mm %813, %arg236 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%815 = torch.aten.t %814 : !torch.tensor -> !torch.tensor | |
%816 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%817 = torch.aten.sum.dim_IntList %810, %816, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%818 = torch.prim.ListConstruct %int3072 : (!torch.int) -> !torch.list<int> | |
%819 = torch.aten.view %817, %818 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%820 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%821 = torch.aten.view %812, %820 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%822 = torch.aten.add.Tensor %787, %821, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%823 = torch.aten.t %815 : !torch.tensor -> !torch.tensor | |
%824 = torch.aten.sub.Tensor %arg234, %result1_43, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%825 = torch.aten.mul.Tensor %824, %result2_44 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%826 = torch.aten.mul.Tensor %822, %arg40 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%827 = torch.aten.mul.Tensor %826, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%828 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%829 = torch.aten.sum.dim_IntList %826, %828, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%830 = torch.aten.mul.Tensor %826, %825 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%831 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%832 = torch.aten.sum.dim_IntList %830, %831, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%833 = torch.aten.mul.Tensor %825, %832 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%834 = torch.aten.sub.Tensor %827, %829, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%835 = torch.aten.sub.Tensor %834, %833, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%836 = torch.aten.div.Tensor %result2_44, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%837 = torch.aten.mul.Tensor %836, %835 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%838 = torch.aten.mul.Tensor %822, %825 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%839 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%840 = torch.aten.sum.dim_IntList %838, %839, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%841 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%842 = torch.aten.sum.dim_IntList %822, %841, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%843 = torch.aten.mul.Tensor %837, %arg233 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%844 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%845 = torch.aten.view %843, %844 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%846 = torch.aten.t %arg231 : !torch.tensor -> !torch.tensor | |
%847 = torch.aten.mm %845, %846 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%848 = torch.aten.t %845 : !torch.tensor -> !torch.tensor | |
%849 = torch.aten.mm %848, %arg232 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%850 = torch.aten.t %849 : !torch.tensor -> !torch.tensor | |
%851 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%852 = torch.aten.sum.dim_IntList %845, %851, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%853 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%854 = torch.aten.view %852, %853 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%855 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%856 = torch.aten.view %847, %855 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%857 = torch.aten.t %850 : !torch.tensor -> !torch.tensor | |
%858 = torch.prim.ListConstruct %int4, %int512, %int12, %int64 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%859 = torch.aten.view %856, %858 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%860 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%861 = torch.aten.permute %859, %860 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%862 = torch.aten.clone %861, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%863 = torch.prim.ListConstruct %int48, %int512, %int64 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%864 = torch.aten._unsafe_view %862, %863 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%865 = torch.aten.transpose.int %arg229, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%866 = torch.aten.bmm %865, %864 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%867 = torch.aten.transpose.int %arg230, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%868 = torch.aten.bmm %864, %867 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%869 = torch.prim.ListConstruct %int4, %int12, %int512, %int64 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%870 = torch.aten.view %866, %869 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%871 = torch.prim.ListConstruct %int4, %int12, %int512, %int512 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%872 = torch.aten.view %868, %871 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%873 = torch.aten.mul.Tensor %872, %arg228 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%874 = torch.aten._softmax_backward_data %873, %arg227, %int-1, %int6 : !torch.tensor, !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%875 = torch.aten.div.Tensor %874, %1 : !torch.tensor, !torch.tensor<[],f64> -> !torch.tensor | |
%876 = torch.prim.ListConstruct %int48, %int512, %int512 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%877 = torch.aten.view %875, %876 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%878 = torch.aten.transpose.int %arg225, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%879 = torch.aten.bmm %878, %877 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%880 = torch.aten.transpose.int %arg226, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%881 = torch.aten.bmm %877, %880 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%882 = torch.prim.ListConstruct %int4, %int12, %int64, %int512 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%883 = torch.aten.view %879, %882 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%884 = torch.prim.ListConstruct %int4, %int12, %int512, %int64 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%885 = torch.aten.view %881, %884 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%886 = torch.aten.transpose.int %883, %int-1, %int-2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%887 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%888 = torch.aten.permute %885, %887 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%889 = torch.aten.clone %888, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%890 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%891 = torch.aten._unsafe_view %889, %890 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%892 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%893 = torch.aten.permute %870, %892 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%894 = torch.aten.clone %893, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%895 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%896 = torch.aten._unsafe_view %894, %895 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%897 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%898 = torch.aten.view %896, %897 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%899 = torch.aten.t %arg223 : !torch.tensor -> !torch.tensor | |
%900 = torch.aten.mm %898, %899 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%901 = torch.aten.t %898 : !torch.tensor -> !torch.tensor | |
%902 = torch.aten.mm %901, %arg224 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%903 = torch.aten.t %902 : !torch.tensor -> !torch.tensor | |
%904 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%905 = torch.aten.sum.dim_IntList %898, %904, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%906 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%907 = torch.aten.view %905, %906 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%908 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%909 = torch.aten.view %900, %908 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%910 = torch.aten.add.Tensor %837, %909, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%911 = torch.aten.t %903 : !torch.tensor -> !torch.tensor | |
%912 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%913 = torch.aten.permute %886, %912 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%914 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%915 = torch.aten.view %913, %914 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%916 = torch.aten.clone %915, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%917 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%918 = torch.aten._unsafe_view %916, %917 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%919 = torch.aten.t %arg221 : !torch.tensor -> !torch.tensor | |
%920 = torch.aten.mm %918, %919 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%921 = torch.aten.t %918 : !torch.tensor -> !torch.tensor | |
%922 = torch.aten.mm %921, %arg222 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%923 = torch.aten.t %922 : !torch.tensor -> !torch.tensor | |
%924 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%925 = torch.aten.sum.dim_IntList %918, %924, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%926 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%927 = torch.aten.view %925, %926 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%928 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%929 = torch.aten.view %920, %928 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%930 = torch.aten.add.Tensor %910, %929, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%931 = torch.aten.t %923 : !torch.tensor -> !torch.tensor | |
%932 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%933 = torch.aten.view %891, %932 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%934 = torch.aten.t %arg219 : !torch.tensor -> !torch.tensor | |
%935 = torch.aten.mm %933, %934 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%936 = torch.aten.t %933 : !torch.tensor -> !torch.tensor | |
%937 = torch.aten.mm %936, %arg220 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%938 = torch.aten.t %937 : !torch.tensor -> !torch.tensor | |
%939 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%940 = torch.aten.sum.dim_IntList %933, %939, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%941 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%942 = torch.aten.view %940, %941 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%943 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%944 = torch.aten.view %935, %943 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%945 = torch.aten.add.Tensor %930, %944, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%946 = torch.aten.t %938 : !torch.tensor -> !torch.tensor | |
%947 = torch.aten.sub.Tensor %arg218, %result1_40, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%948 = torch.aten.mul.Tensor %947, %result2_41 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%949 = torch.aten.mul.Tensor %945, %arg38 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%950 = torch.aten.mul.Tensor %949, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%951 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%952 = torch.aten.sum.dim_IntList %949, %951, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%953 = torch.aten.mul.Tensor %949, %948 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%954 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%955 = torch.aten.sum.dim_IntList %953, %954, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%956 = torch.aten.mul.Tensor %948, %955 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%957 = torch.aten.sub.Tensor %950, %952, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%958 = torch.aten.sub.Tensor %957, %956, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%959 = torch.aten.div.Tensor %result2_41, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%960 = torch.aten.mul.Tensor %959, %958 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%961 = torch.aten.mul.Tensor %945, %948 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%962 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%963 = torch.aten.sum.dim_IntList %961, %962, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%964 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%965 = torch.aten.sum.dim_IntList %945, %964, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%966 = torch.aten.mul.Tensor %960, %arg217 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%967 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%968 = torch.aten.view %966, %967 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%969 = torch.aten.t %arg215 : !torch.tensor -> !torch.tensor | |
%970 = torch.aten.mm %968, %969 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%971 = torch.aten.t %968 : !torch.tensor -> !torch.tensor | |
%972 = torch.aten.mm %971, %arg216 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%973 = torch.aten.t %972 : !torch.tensor -> !torch.tensor | |
%974 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%975 = torch.aten.sum.dim_IntList %968, %974, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%976 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%977 = torch.aten.view %975, %976 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%978 = torch.prim.ListConstruct %int4, %int512, %int3072 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%979 = torch.aten.view %970, %978 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%980 = torch.aten.t %973 : !torch.tensor -> !torch.tensor | |
%981 = torch.aten.gelu_backward %979, %arg214, %str : !torch.tensor, !torch.tensor, !torch.str -> !torch.tensor | |
%982 = torch.prim.ListConstruct %int2048, %int3072 : (!torch.int, !torch.int) -> !torch.list<int> | |
%983 = torch.aten.view %981, %982 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%984 = torch.aten.t %arg212 : !torch.tensor -> !torch.tensor | |
%985 = torch.aten.mm %983, %984 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%986 = torch.aten.t %983 : !torch.tensor -> !torch.tensor | |
%987 = torch.aten.mm %986, %arg213 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%988 = torch.aten.t %987 : !torch.tensor -> !torch.tensor | |
%989 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%990 = torch.aten.sum.dim_IntList %983, %989, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%991 = torch.prim.ListConstruct %int3072 : (!torch.int) -> !torch.list<int> | |
%992 = torch.aten.view %990, %991 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%993 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%994 = torch.aten.view %985, %993 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%995 = torch.aten.add.Tensor %960, %994, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%996 = torch.aten.t %988 : !torch.tensor -> !torch.tensor | |
%997 = torch.aten.sub.Tensor %arg211, %result1_37, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%998 = torch.aten.mul.Tensor %997, %result2_38 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%999 = torch.aten.mul.Tensor %995, %arg36 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1000 = torch.aten.mul.Tensor %999, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%1001 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%1002 = torch.aten.sum.dim_IntList %999, %1001, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1003 = torch.aten.mul.Tensor %999, %998 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1004 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%1005 = torch.aten.sum.dim_IntList %1003, %1004, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1006 = torch.aten.mul.Tensor %998, %1005 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1007 = torch.aten.sub.Tensor %1000, %1002, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1008 = torch.aten.sub.Tensor %1007, %1006, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1009 = torch.aten.div.Tensor %result2_38, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%1010 = torch.aten.mul.Tensor %1009, %1008 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1011 = torch.aten.mul.Tensor %995, %998 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1012 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1013 = torch.aten.sum.dim_IntList %1011, %1012, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1014 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1015 = torch.aten.sum.dim_IntList %995, %1014, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1016 = torch.aten.mul.Tensor %1010, %arg210 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1017 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1018 = torch.aten.view %1016, %1017 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1019 = torch.aten.t %arg208 : !torch.tensor -> !torch.tensor | |
%1020 = torch.aten.mm %1018, %1019 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1021 = torch.aten.t %1018 : !torch.tensor -> !torch.tensor | |
%1022 = torch.aten.mm %1021, %arg209 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1023 = torch.aten.t %1022 : !torch.tensor -> !torch.tensor | |
%1024 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%1025 = torch.aten.sum.dim_IntList %1018, %1024, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1026 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%1027 = torch.aten.view %1025, %1026 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1028 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1029 = torch.aten.view %1020, %1028 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1030 = torch.aten.t %1023 : !torch.tensor -> !torch.tensor | |
%1031 = torch.prim.ListConstruct %int4, %int512, %int12, %int64 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1032 = torch.aten.view %1029, %1031 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1033 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1034 = torch.aten.permute %1032, %1033 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1035 = torch.aten.clone %1034, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%1036 = torch.prim.ListConstruct %int48, %int512, %int64 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1037 = torch.aten._unsafe_view %1035, %1036 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1038 = torch.aten.transpose.int %arg206, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%1039 = torch.aten.bmm %1038, %1037 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1040 = torch.aten.transpose.int %arg207, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%1041 = torch.aten.bmm %1037, %1040 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1042 = torch.prim.ListConstruct %int4, %int12, %int512, %int64 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1043 = torch.aten.view %1039, %1042 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1044 = torch.prim.ListConstruct %int4, %int12, %int512, %int512 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1045 = torch.aten.view %1041, %1044 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1046 = torch.aten.mul.Tensor %1045, %arg205 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1047 = torch.aten._softmax_backward_data %1046, %arg204, %int-1, %int6 : !torch.tensor, !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%1048 = torch.aten.div.Tensor %1047, %1 : !torch.tensor, !torch.tensor<[],f64> -> !torch.tensor | |
%1049 = torch.prim.ListConstruct %int48, %int512, %int512 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1050 = torch.aten.view %1048, %1049 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1051 = torch.aten.transpose.int %arg202, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%1052 = torch.aten.bmm %1051, %1050 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1053 = torch.aten.transpose.int %arg203, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%1054 = torch.aten.bmm %1050, %1053 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1055 = torch.prim.ListConstruct %int4, %int12, %int64, %int512 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1056 = torch.aten.view %1052, %1055 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1057 = torch.prim.ListConstruct %int4, %int12, %int512, %int64 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1058 = torch.aten.view %1054, %1057 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1059 = torch.aten.transpose.int %1056, %int-1, %int-2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%1060 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1061 = torch.aten.permute %1058, %1060 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1062 = torch.aten.clone %1061, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%1063 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1064 = torch.aten._unsafe_view %1062, %1063 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1065 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1066 = torch.aten.permute %1043, %1065 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1067 = torch.aten.clone %1066, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%1068 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1069 = torch.aten._unsafe_view %1067, %1068 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1070 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1071 = torch.aten.view %1069, %1070 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1072 = torch.aten.t %arg200 : !torch.tensor -> !torch.tensor | |
%1073 = torch.aten.mm %1071, %1072 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1074 = torch.aten.t %1071 : !torch.tensor -> !torch.tensor | |
%1075 = torch.aten.mm %1074, %arg201 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1076 = torch.aten.t %1075 : !torch.tensor -> !torch.tensor | |
%1077 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%1078 = torch.aten.sum.dim_IntList %1071, %1077, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1079 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%1080 = torch.aten.view %1078, %1079 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1081 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1082 = torch.aten.view %1073, %1081 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1083 = torch.aten.add.Tensor %1010, %1082, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1084 = torch.aten.t %1076 : !torch.tensor -> !torch.tensor | |
%1085 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1086 = torch.aten.permute %1059, %1085 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1087 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1088 = torch.aten.view %1086, %1087 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1089 = torch.aten.clone %1088, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%1090 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1091 = torch.aten._unsafe_view %1089, %1090 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1092 = torch.aten.t %arg198 : !torch.tensor -> !torch.tensor | |
%1093 = torch.aten.mm %1091, %1092 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1094 = torch.aten.t %1091 : !torch.tensor -> !torch.tensor | |
%1095 = torch.aten.mm %1094, %arg199 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1096 = torch.aten.t %1095 : !torch.tensor -> !torch.tensor | |
%1097 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%1098 = torch.aten.sum.dim_IntList %1091, %1097, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1099 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%1100 = torch.aten.view %1098, %1099 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1101 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1102 = torch.aten.view %1093, %1101 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1103 = torch.aten.add.Tensor %1083, %1102, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1104 = torch.aten.t %1096 : !torch.tensor -> !torch.tensor | |
%1105 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1106 = torch.aten.view %1064, %1105 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1107 = torch.aten.t %arg196 : !torch.tensor -> !torch.tensor | |
%1108 = torch.aten.mm %1106, %1107 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1109 = torch.aten.t %1106 : !torch.tensor -> !torch.tensor | |
%1110 = torch.aten.mm %1109, %arg197 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1111 = torch.aten.t %1110 : !torch.tensor -> !torch.tensor | |
%1112 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%1113 = torch.aten.sum.dim_IntList %1106, %1112, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1114 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%1115 = torch.aten.view %1113, %1114 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1116 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1117 = torch.aten.view %1108, %1116 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1118 = torch.aten.add.Tensor %1103, %1117, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1119 = torch.aten.t %1111 : !torch.tensor -> !torch.tensor | |
%1120 = torch.aten.sub.Tensor %arg195, %result1_34, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1121 = torch.aten.mul.Tensor %1120, %result2_35 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1122 = torch.aten.mul.Tensor %1118, %arg34 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1123 = torch.aten.mul.Tensor %1122, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%1124 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%1125 = torch.aten.sum.dim_IntList %1122, %1124, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1126 = torch.aten.mul.Tensor %1122, %1121 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1127 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%1128 = torch.aten.sum.dim_IntList %1126, %1127, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1129 = torch.aten.mul.Tensor %1121, %1128 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1130 = torch.aten.sub.Tensor %1123, %1125, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1131 = torch.aten.sub.Tensor %1130, %1129, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1132 = torch.aten.div.Tensor %result2_35, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%1133 = torch.aten.mul.Tensor %1132, %1131 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1134 = torch.aten.mul.Tensor %1118, %1121 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1135 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1136 = torch.aten.sum.dim_IntList %1134, %1135, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1137 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1138 = torch.aten.sum.dim_IntList %1118, %1137, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1139 = torch.aten.mul.Tensor %1133, %arg194 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1140 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1141 = torch.aten.view %1139, %1140 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1142 = torch.aten.t %arg192 : !torch.tensor -> !torch.tensor | |
%1143 = torch.aten.mm %1141, %1142 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1144 = torch.aten.t %1141 : !torch.tensor -> !torch.tensor | |
%1145 = torch.aten.mm %1144, %arg193 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1146 = torch.aten.t %1145 : !torch.tensor -> !torch.tensor | |
%1147 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%1148 = torch.aten.sum.dim_IntList %1141, %1147, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1149 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%1150 = torch.aten.view %1148, %1149 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1151 = torch.prim.ListConstruct %int4, %int512, %int3072 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1152 = torch.aten.view %1143, %1151 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1153 = torch.aten.t %1146 : !torch.tensor -> !torch.tensor | |
%1154 = torch.aten.gelu_backward %1152, %arg191, %str : !torch.tensor, !torch.tensor, !torch.str -> !torch.tensor | |
%1155 = torch.prim.ListConstruct %int2048, %int3072 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1156 = torch.aten.view %1154, %1155 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1157 = torch.aten.t %arg189 : !torch.tensor -> !torch.tensor | |
%1158 = torch.aten.mm %1156, %1157 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1159 = torch.aten.t %1156 : !torch.tensor -> !torch.tensor | |
%1160 = torch.aten.mm %1159, %arg190 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1161 = torch.aten.t %1160 : !torch.tensor -> !torch.tensor | |
%1162 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%1163 = torch.aten.sum.dim_IntList %1156, %1162, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1164 = torch.prim.ListConstruct %int3072 : (!torch.int) -> !torch.list<int> | |
%1165 = torch.aten.view %1163, %1164 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1166 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1167 = torch.aten.view %1158, %1166 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1168 = torch.aten.add.Tensor %1133, %1167, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1169 = torch.aten.t %1161 : !torch.tensor -> !torch.tensor | |
%1170 = torch.aten.sub.Tensor %arg188, %result1_31, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1171 = torch.aten.mul.Tensor %1170, %result2_32 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1172 = torch.aten.mul.Tensor %1168, %arg32 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1173 = torch.aten.mul.Tensor %1172, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%1174 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%1175 = torch.aten.sum.dim_IntList %1172, %1174, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1176 = torch.aten.mul.Tensor %1172, %1171 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1177 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%1178 = torch.aten.sum.dim_IntList %1176, %1177, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1179 = torch.aten.mul.Tensor %1171, %1178 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1180 = torch.aten.sub.Tensor %1173, %1175, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1181 = torch.aten.sub.Tensor %1180, %1179, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1182 = torch.aten.div.Tensor %result2_32, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%1183 = torch.aten.mul.Tensor %1182, %1181 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1184 = torch.aten.mul.Tensor %1168, %1171 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1185 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1186 = torch.aten.sum.dim_IntList %1184, %1185, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1187 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1188 = torch.aten.sum.dim_IntList %1168, %1187, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1189 = torch.aten.mul.Tensor %1183, %arg187 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1190 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1191 = torch.aten.view %1189, %1190 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1192 = torch.aten.t %arg185 : !torch.tensor -> !torch.tensor | |
%1193 = torch.aten.mm %1191, %1192 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1194 = torch.aten.t %1191 : !torch.tensor -> !torch.tensor | |
%1195 = torch.aten.mm %1194, %arg186 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1196 = torch.aten.t %1195 : !torch.tensor -> !torch.tensor | |
%1197 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%1198 = torch.aten.sum.dim_IntList %1191, %1197, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1199 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%1200 = torch.aten.view %1198, %1199 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1201 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1202 = torch.aten.view %1193, %1201 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1203 = torch.aten.t %1196 : !torch.tensor -> !torch.tensor | |
%1204 = torch.prim.ListConstruct %int4, %int512, %int12, %int64 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1205 = torch.aten.view %1202, %1204 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1206 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1207 = torch.aten.permute %1205, %1206 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1208 = torch.aten.clone %1207, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%1209 = torch.prim.ListConstruct %int48, %int512, %int64 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1210 = torch.aten._unsafe_view %1208, %1209 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1211 = torch.aten.transpose.int %arg183, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%1212 = torch.aten.bmm %1211, %1210 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1213 = torch.aten.transpose.int %arg184, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%1214 = torch.aten.bmm %1210, %1213 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1215 = torch.prim.ListConstruct %int4, %int12, %int512, %int64 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1216 = torch.aten.view %1212, %1215 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1217 = torch.prim.ListConstruct %int4, %int12, %int512, %int512 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1218 = torch.aten.view %1214, %1217 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1219 = torch.aten.mul.Tensor %1218, %arg182 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1220 = torch.aten._softmax_backward_data %1219, %arg181, %int-1, %int6 : !torch.tensor, !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%1221 = torch.aten.div.Tensor %1220, %1 : !torch.tensor, !torch.tensor<[],f64> -> !torch.tensor | |
%1222 = torch.prim.ListConstruct %int48, %int512, %int512 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1223 = torch.aten.view %1221, %1222 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1224 = torch.aten.transpose.int %arg179, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%1225 = torch.aten.bmm %1224, %1223 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1226 = torch.aten.transpose.int %arg180, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%1227 = torch.aten.bmm %1223, %1226 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1228 = torch.prim.ListConstruct %int4, %int12, %int64, %int512 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1229 = torch.aten.view %1225, %1228 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1230 = torch.prim.ListConstruct %int4, %int12, %int512, %int64 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1231 = torch.aten.view %1227, %1230 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1232 = torch.aten.transpose.int %1229, %int-1, %int-2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%1233 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1234 = torch.aten.permute %1231, %1233 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1235 = torch.aten.clone %1234, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%1236 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1237 = torch.aten._unsafe_view %1235, %1236 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1238 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1239 = torch.aten.permute %1216, %1238 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1240 = torch.aten.clone %1239, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%1241 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1242 = torch.aten._unsafe_view %1240, %1241 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1243 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1244 = torch.aten.view %1242, %1243 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1245 = torch.aten.t %arg177 : !torch.tensor -> !torch.tensor | |
%1246 = torch.aten.mm %1244, %1245 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1247 = torch.aten.t %1244 : !torch.tensor -> !torch.tensor | |
%1248 = torch.aten.mm %1247, %arg178 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1249 = torch.aten.t %1248 : !torch.tensor -> !torch.tensor | |
%1250 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%1251 = torch.aten.sum.dim_IntList %1244, %1250, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1252 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%1253 = torch.aten.view %1251, %1252 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1254 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1255 = torch.aten.view %1246, %1254 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1256 = torch.aten.add.Tensor %1183, %1255, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1257 = torch.aten.t %1249 : !torch.tensor -> !torch.tensor | |
%1258 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1259 = torch.aten.permute %1232, %1258 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1260 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1261 = torch.aten.view %1259, %1260 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1262 = torch.aten.clone %1261, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%1263 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1264 = torch.aten._unsafe_view %1262, %1263 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1265 = torch.aten.t %arg175 : !torch.tensor -> !torch.tensor | |
%1266 = torch.aten.mm %1264, %1265 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1267 = torch.aten.t %1264 : !torch.tensor -> !torch.tensor | |
%1268 = torch.aten.mm %1267, %arg176 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1269 = torch.aten.t %1268 : !torch.tensor -> !torch.tensor | |
%1270 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%1271 = torch.aten.sum.dim_IntList %1264, %1270, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1272 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%1273 = torch.aten.view %1271, %1272 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1274 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1275 = torch.aten.view %1266, %1274 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1276 = torch.aten.add.Tensor %1256, %1275, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1277 = torch.aten.t %1269 : !torch.tensor -> !torch.tensor | |
%1278 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1279 = torch.aten.view %1237, %1278 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1280 = torch.aten.t %arg173 : !torch.tensor -> !torch.tensor | |
%1281 = torch.aten.mm %1279, %1280 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1282 = torch.aten.t %1279 : !torch.tensor -> !torch.tensor | |
%1283 = torch.aten.mm %1282, %arg174 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1284 = torch.aten.t %1283 : !torch.tensor -> !torch.tensor | |
%1285 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%1286 = torch.aten.sum.dim_IntList %1279, %1285, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1287 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%1288 = torch.aten.view %1286, %1287 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1289 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1290 = torch.aten.view %1281, %1289 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1291 = torch.aten.add.Tensor %1276, %1290, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1292 = torch.aten.t %1284 : !torch.tensor -> !torch.tensor | |
%1293 = torch.aten.sub.Tensor %arg172, %result1_28, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1294 = torch.aten.mul.Tensor %1293, %result2_29 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1295 = torch.aten.mul.Tensor %1291, %arg30 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1296 = torch.aten.mul.Tensor %1295, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%1297 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%1298 = torch.aten.sum.dim_IntList %1295, %1297, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1299 = torch.aten.mul.Tensor %1295, %1294 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1300 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%1301 = torch.aten.sum.dim_IntList %1299, %1300, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1302 = torch.aten.mul.Tensor %1294, %1301 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1303 = torch.aten.sub.Tensor %1296, %1298, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1304 = torch.aten.sub.Tensor %1303, %1302, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1305 = torch.aten.div.Tensor %result2_29, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%1306 = torch.aten.mul.Tensor %1305, %1304 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1307 = torch.aten.mul.Tensor %1291, %1294 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1308 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1309 = torch.aten.sum.dim_IntList %1307, %1308, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1310 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1311 = torch.aten.sum.dim_IntList %1291, %1310, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1312 = torch.aten.mul.Tensor %1306, %arg171 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1313 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1314 = torch.aten.view %1312, %1313 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1315 = torch.aten.t %arg169 : !torch.tensor -> !torch.tensor | |
%1316 = torch.aten.mm %1314, %1315 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1317 = torch.aten.t %1314 : !torch.tensor -> !torch.tensor | |
%1318 = torch.aten.mm %1317, %arg170 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1319 = torch.aten.t %1318 : !torch.tensor -> !torch.tensor | |
%1320 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%1321 = torch.aten.sum.dim_IntList %1314, %1320, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1322 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%1323 = torch.aten.view %1321, %1322 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1324 = torch.prim.ListConstruct %int4, %int512, %int3072 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1325 = torch.aten.view %1316, %1324 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1326 = torch.aten.t %1319 : !torch.tensor -> !torch.tensor | |
%1327 = torch.aten.gelu_backward %1325, %arg168, %str : !torch.tensor, !torch.tensor, !torch.str -> !torch.tensor | |
%1328 = torch.prim.ListConstruct %int2048, %int3072 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1329 = torch.aten.view %1327, %1328 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1330 = torch.aten.t %arg166 : !torch.tensor -> !torch.tensor | |
%1331 = torch.aten.mm %1329, %1330 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1332 = torch.aten.t %1329 : !torch.tensor -> !torch.tensor | |
%1333 = torch.aten.mm %1332, %arg167 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1334 = torch.aten.t %1333 : !torch.tensor -> !torch.tensor | |
%1335 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%1336 = torch.aten.sum.dim_IntList %1329, %1335, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1337 = torch.prim.ListConstruct %int3072 : (!torch.int) -> !torch.list<int> | |
%1338 = torch.aten.view %1336, %1337 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1339 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1340 = torch.aten.view %1331, %1339 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1341 = torch.aten.add.Tensor %1306, %1340, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1342 = torch.aten.t %1334 : !torch.tensor -> !torch.tensor | |
%1343 = torch.aten.sub.Tensor %arg165, %result1_25, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1344 = torch.aten.mul.Tensor %1343, %result2_26 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1345 = torch.aten.mul.Tensor %1341, %arg28 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1346 = torch.aten.mul.Tensor %1345, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%1347 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%1348 = torch.aten.sum.dim_IntList %1345, %1347, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1349 = torch.aten.mul.Tensor %1345, %1344 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1350 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%1351 = torch.aten.sum.dim_IntList %1349, %1350, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1352 = torch.aten.mul.Tensor %1344, %1351 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1353 = torch.aten.sub.Tensor %1346, %1348, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1354 = torch.aten.sub.Tensor %1353, %1352, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1355 = torch.aten.div.Tensor %result2_26, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%1356 = torch.aten.mul.Tensor %1355, %1354 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1357 = torch.aten.mul.Tensor %1341, %1344 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1358 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1359 = torch.aten.sum.dim_IntList %1357, %1358, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1360 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1361 = torch.aten.sum.dim_IntList %1341, %1360, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1362 = torch.aten.mul.Tensor %1356, %arg164 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1363 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1364 = torch.aten.view %1362, %1363 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1365 = torch.aten.t %arg162 : !torch.tensor -> !torch.tensor | |
%1366 = torch.aten.mm %1364, %1365 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1367 = torch.aten.t %1364 : !torch.tensor -> !torch.tensor | |
%1368 = torch.aten.mm %1367, %arg163 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1369 = torch.aten.t %1368 : !torch.tensor -> !torch.tensor | |
%1370 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%1371 = torch.aten.sum.dim_IntList %1364, %1370, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1372 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%1373 = torch.aten.view %1371, %1372 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1374 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1375 = torch.aten.view %1366, %1374 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1376 = torch.aten.t %1369 : !torch.tensor -> !torch.tensor | |
%1377 = torch.prim.ListConstruct %int4, %int512, %int12, %int64 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1378 = torch.aten.view %1375, %1377 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1379 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1380 = torch.aten.permute %1378, %1379 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1381 = torch.aten.clone %1380, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%1382 = torch.prim.ListConstruct %int48, %int512, %int64 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1383 = torch.aten._unsafe_view %1381, %1382 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1384 = torch.aten.transpose.int %arg160, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%1385 = torch.aten.bmm %1384, %1383 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1386 = torch.aten.transpose.int %arg161, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%1387 = torch.aten.bmm %1383, %1386 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1388 = torch.prim.ListConstruct %int4, %int12, %int512, %int64 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1389 = torch.aten.view %1385, %1388 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1390 = torch.prim.ListConstruct %int4, %int12, %int512, %int512 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1391 = torch.aten.view %1387, %1390 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1392 = torch.aten.mul.Tensor %1391, %arg159 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1393 = torch.aten._softmax_backward_data %1392, %arg158, %int-1, %int6 : !torch.tensor, !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%1394 = torch.aten.div.Tensor %1393, %1 : !torch.tensor, !torch.tensor<[],f64> -> !torch.tensor | |
%1395 = torch.prim.ListConstruct %int48, %int512, %int512 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1396 = torch.aten.view %1394, %1395 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1397 = torch.aten.transpose.int %arg156, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%1398 = torch.aten.bmm %1397, %1396 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1399 = torch.aten.transpose.int %arg157, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%1400 = torch.aten.bmm %1396, %1399 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1401 = torch.prim.ListConstruct %int4, %int12, %int64, %int512 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1402 = torch.aten.view %1398, %1401 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1403 = torch.prim.ListConstruct %int4, %int12, %int512, %int64 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1404 = torch.aten.view %1400, %1403 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1405 = torch.aten.transpose.int %1402, %int-1, %int-2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%1406 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1407 = torch.aten.permute %1404, %1406 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1408 = torch.aten.clone %1407, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%1409 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1410 = torch.aten._unsafe_view %1408, %1409 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1411 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1412 = torch.aten.permute %1389, %1411 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1413 = torch.aten.clone %1412, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%1414 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1415 = torch.aten._unsafe_view %1413, %1414 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1416 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1417 = torch.aten.view %1415, %1416 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1418 = torch.aten.t %arg154 : !torch.tensor -> !torch.tensor | |
%1419 = torch.aten.mm %1417, %1418 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1420 = torch.aten.t %1417 : !torch.tensor -> !torch.tensor | |
%1421 = torch.aten.mm %1420, %arg155 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1422 = torch.aten.t %1421 : !torch.tensor -> !torch.tensor | |
%1423 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%1424 = torch.aten.sum.dim_IntList %1417, %1423, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1425 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%1426 = torch.aten.view %1424, %1425 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1427 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1428 = torch.aten.view %1419, %1427 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1429 = torch.aten.add.Tensor %1356, %1428, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1430 = torch.aten.t %1422 : !torch.tensor -> !torch.tensor | |
%1431 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1432 = torch.aten.permute %1405, %1431 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1433 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1434 = torch.aten.view %1432, %1433 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1435 = torch.aten.clone %1434, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%1436 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1437 = torch.aten._unsafe_view %1435, %1436 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1438 = torch.aten.t %arg152 : !torch.tensor -> !torch.tensor | |
%1439 = torch.aten.mm %1437, %1438 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1440 = torch.aten.t %1437 : !torch.tensor -> !torch.tensor | |
%1441 = torch.aten.mm %1440, %arg153 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1442 = torch.aten.t %1441 : !torch.tensor -> !torch.tensor | |
%1443 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%1444 = torch.aten.sum.dim_IntList %1437, %1443, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1445 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%1446 = torch.aten.view %1444, %1445 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1447 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1448 = torch.aten.view %1439, %1447 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1449 = torch.aten.add.Tensor %1429, %1448, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1450 = torch.aten.t %1442 : !torch.tensor -> !torch.tensor | |
%1451 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1452 = torch.aten.view %1410, %1451 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1453 = torch.aten.t %arg150 : !torch.tensor -> !torch.tensor | |
%1454 = torch.aten.mm %1452, %1453 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1455 = torch.aten.t %1452 : !torch.tensor -> !torch.tensor | |
%1456 = torch.aten.mm %1455, %arg151 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1457 = torch.aten.t %1456 : !torch.tensor -> !torch.tensor | |
%1458 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%1459 = torch.aten.sum.dim_IntList %1452, %1458, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1460 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%1461 = torch.aten.view %1459, %1460 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1462 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1463 = torch.aten.view %1454, %1462 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1464 = torch.aten.add.Tensor %1449, %1463, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1465 = torch.aten.t %1457 : !torch.tensor -> !torch.tensor | |
%1466 = torch.aten.sub.Tensor %arg149, %result1_22, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1467 = torch.aten.mul.Tensor %1466, %result2_23 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1468 = torch.aten.mul.Tensor %1464, %arg26 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1469 = torch.aten.mul.Tensor %1468, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%1470 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%1471 = torch.aten.sum.dim_IntList %1468, %1470, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1472 = torch.aten.mul.Tensor %1468, %1467 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1473 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%1474 = torch.aten.sum.dim_IntList %1472, %1473, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1475 = torch.aten.mul.Tensor %1467, %1474 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1476 = torch.aten.sub.Tensor %1469, %1471, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1477 = torch.aten.sub.Tensor %1476, %1475, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1478 = torch.aten.div.Tensor %result2_23, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%1479 = torch.aten.mul.Tensor %1478, %1477 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1480 = torch.aten.mul.Tensor %1464, %1467 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1481 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1482 = torch.aten.sum.dim_IntList %1480, %1481, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1483 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1484 = torch.aten.sum.dim_IntList %1464, %1483, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1485 = torch.aten.mul.Tensor %1479, %arg148 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1486 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1487 = torch.aten.view %1485, %1486 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1488 = torch.aten.t %arg146 : !torch.tensor -> !torch.tensor | |
%1489 = torch.aten.mm %1487, %1488 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1490 = torch.aten.t %1487 : !torch.tensor -> !torch.tensor | |
%1491 = torch.aten.mm %1490, %arg147 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1492 = torch.aten.t %1491 : !torch.tensor -> !torch.tensor | |
%1493 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%1494 = torch.aten.sum.dim_IntList %1487, %1493, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1495 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%1496 = torch.aten.view %1494, %1495 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1497 = torch.prim.ListConstruct %int4, %int512, %int3072 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1498 = torch.aten.view %1489, %1497 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1499 = torch.aten.t %1492 : !torch.tensor -> !torch.tensor | |
%1500 = torch.aten.gelu_backward %1498, %arg145, %str : !torch.tensor, !torch.tensor, !torch.str -> !torch.tensor | |
%1501 = torch.prim.ListConstruct %int2048, %int3072 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1502 = torch.aten.view %1500, %1501 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1503 = torch.aten.t %arg143 : !torch.tensor -> !torch.tensor | |
%1504 = torch.aten.mm %1502, %1503 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1505 = torch.aten.t %1502 : !torch.tensor -> !torch.tensor | |
%1506 = torch.aten.mm %1505, %arg144 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1507 = torch.aten.t %1506 : !torch.tensor -> !torch.tensor | |
%1508 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%1509 = torch.aten.sum.dim_IntList %1502, %1508, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1510 = torch.prim.ListConstruct %int3072 : (!torch.int) -> !torch.list<int> | |
%1511 = torch.aten.view %1509, %1510 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1512 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1513 = torch.aten.view %1504, %1512 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1514 = torch.aten.add.Tensor %1479, %1513, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1515 = torch.aten.t %1507 : !torch.tensor -> !torch.tensor | |
%1516 = torch.aten.sub.Tensor %arg142, %result1_19, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1517 = torch.aten.mul.Tensor %1516, %result2_20 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1518 = torch.aten.mul.Tensor %1514, %arg24 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1519 = torch.aten.mul.Tensor %1518, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%1520 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%1521 = torch.aten.sum.dim_IntList %1518, %1520, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1522 = torch.aten.mul.Tensor %1518, %1517 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1523 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%1524 = torch.aten.sum.dim_IntList %1522, %1523, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1525 = torch.aten.mul.Tensor %1517, %1524 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1526 = torch.aten.sub.Tensor %1519, %1521, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1527 = torch.aten.sub.Tensor %1526, %1525, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1528 = torch.aten.div.Tensor %result2_20, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%1529 = torch.aten.mul.Tensor %1528, %1527 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1530 = torch.aten.mul.Tensor %1514, %1517 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1531 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1532 = torch.aten.sum.dim_IntList %1530, %1531, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1533 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1534 = torch.aten.sum.dim_IntList %1514, %1533, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1535 = torch.aten.mul.Tensor %1529, %arg141 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1536 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1537 = torch.aten.view %1535, %1536 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1538 = torch.aten.t %arg139 : !torch.tensor -> !torch.tensor | |
%1539 = torch.aten.mm %1537, %1538 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1540 = torch.aten.t %1537 : !torch.tensor -> !torch.tensor | |
%1541 = torch.aten.mm %1540, %arg140 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1542 = torch.aten.t %1541 : !torch.tensor -> !torch.tensor | |
%1543 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%1544 = torch.aten.sum.dim_IntList %1537, %1543, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1545 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%1546 = torch.aten.view %1544, %1545 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1547 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1548 = torch.aten.view %1539, %1547 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1549 = torch.aten.t %1542 : !torch.tensor -> !torch.tensor | |
%1550 = torch.prim.ListConstruct %int4, %int512, %int12, %int64 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1551 = torch.aten.view %1548, %1550 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1552 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1553 = torch.aten.permute %1551, %1552 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1554 = torch.aten.clone %1553, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%1555 = torch.prim.ListConstruct %int48, %int512, %int64 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1556 = torch.aten._unsafe_view %1554, %1555 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1557 = torch.aten.transpose.int %arg137, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%1558 = torch.aten.bmm %1557, %1556 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1559 = torch.aten.transpose.int %arg138, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%1560 = torch.aten.bmm %1556, %1559 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1561 = torch.prim.ListConstruct %int4, %int12, %int512, %int64 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1562 = torch.aten.view %1558, %1561 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1563 = torch.prim.ListConstruct %int4, %int12, %int512, %int512 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1564 = torch.aten.view %1560, %1563 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1565 = torch.aten.mul.Tensor %1564, %arg136 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1566 = torch.aten._softmax_backward_data %1565, %arg135, %int-1, %int6 : !torch.tensor, !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%1567 = torch.aten.div.Tensor %1566, %1 : !torch.tensor, !torch.tensor<[],f64> -> !torch.tensor | |
%1568 = torch.prim.ListConstruct %int48, %int512, %int512 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1569 = torch.aten.view %1567, %1568 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1570 = torch.aten.transpose.int %arg133, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%1571 = torch.aten.bmm %1570, %1569 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1572 = torch.aten.transpose.int %arg134, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%1573 = torch.aten.bmm %1569, %1572 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1574 = torch.prim.ListConstruct %int4, %int12, %int64, %int512 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1575 = torch.aten.view %1571, %1574 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1576 = torch.prim.ListConstruct %int4, %int12, %int512, %int64 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1577 = torch.aten.view %1573, %1576 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1578 = torch.aten.transpose.int %1575, %int-1, %int-2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%1579 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1580 = torch.aten.permute %1577, %1579 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1581 = torch.aten.clone %1580, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%1582 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1583 = torch.aten._unsafe_view %1581, %1582 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1584 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1585 = torch.aten.permute %1562, %1584 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1586 = torch.aten.clone %1585, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%1587 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1588 = torch.aten._unsafe_view %1586, %1587 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1589 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1590 = torch.aten.view %1588, %1589 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1591 = torch.aten.t %arg131 : !torch.tensor -> !torch.tensor | |
%1592 = torch.aten.mm %1590, %1591 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1593 = torch.aten.t %1590 : !torch.tensor -> !torch.tensor | |
%1594 = torch.aten.mm %1593, %arg132 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1595 = torch.aten.t %1594 : !torch.tensor -> !torch.tensor | |
%1596 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%1597 = torch.aten.sum.dim_IntList %1590, %1596, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1598 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%1599 = torch.aten.view %1597, %1598 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1600 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1601 = torch.aten.view %1592, %1600 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1602 = torch.aten.add.Tensor %1529, %1601, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1603 = torch.aten.t %1595 : !torch.tensor -> !torch.tensor | |
%1604 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1605 = torch.aten.permute %1578, %1604 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1606 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1607 = torch.aten.view %1605, %1606 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1608 = torch.aten.clone %1607, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%1609 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1610 = torch.aten._unsafe_view %1608, %1609 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1611 = torch.aten.t %arg129 : !torch.tensor -> !torch.tensor | |
%1612 = torch.aten.mm %1610, %1611 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1613 = torch.aten.t %1610 : !torch.tensor -> !torch.tensor | |
%1614 = torch.aten.mm %1613, %arg130 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1615 = torch.aten.t %1614 : !torch.tensor -> !torch.tensor | |
%1616 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%1617 = torch.aten.sum.dim_IntList %1610, %1616, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1618 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%1619 = torch.aten.view %1617, %1618 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1620 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1621 = torch.aten.view %1612, %1620 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1622 = torch.aten.add.Tensor %1602, %1621, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1623 = torch.aten.t %1615 : !torch.tensor -> !torch.tensor | |
%1624 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1625 = torch.aten.view %1583, %1624 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1626 = torch.aten.t %arg127 : !torch.tensor -> !torch.tensor | |
%1627 = torch.aten.mm %1625, %1626 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1628 = torch.aten.t %1625 : !torch.tensor -> !torch.tensor | |
%1629 = torch.aten.mm %1628, %arg128 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1630 = torch.aten.t %1629 : !torch.tensor -> !torch.tensor | |
%1631 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%1632 = torch.aten.sum.dim_IntList %1625, %1631, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1633 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%1634 = torch.aten.view %1632, %1633 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1635 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1636 = torch.aten.view %1627, %1635 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1637 = torch.aten.add.Tensor %1622, %1636, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1638 = torch.aten.t %1630 : !torch.tensor -> !torch.tensor | |
%1639 = torch.aten.sub.Tensor %arg126, %result1_16, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1640 = torch.aten.mul.Tensor %1639, %result2_17 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1641 = torch.aten.mul.Tensor %1637, %arg22 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1642 = torch.aten.mul.Tensor %1641, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%1643 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%1644 = torch.aten.sum.dim_IntList %1641, %1643, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1645 = torch.aten.mul.Tensor %1641, %1640 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1646 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%1647 = torch.aten.sum.dim_IntList %1645, %1646, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1648 = torch.aten.mul.Tensor %1640, %1647 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1649 = torch.aten.sub.Tensor %1642, %1644, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1650 = torch.aten.sub.Tensor %1649, %1648, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1651 = torch.aten.div.Tensor %result2_17, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%1652 = torch.aten.mul.Tensor %1651, %1650 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1653 = torch.aten.mul.Tensor %1637, %1640 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1654 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1655 = torch.aten.sum.dim_IntList %1653, %1654, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1656 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1657 = torch.aten.sum.dim_IntList %1637, %1656, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1658 = torch.aten.mul.Tensor %1652, %arg125 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1659 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1660 = torch.aten.view %1658, %1659 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1661 = torch.aten.t %arg123 : !torch.tensor -> !torch.tensor | |
%1662 = torch.aten.mm %1660, %1661 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1663 = torch.aten.t %1660 : !torch.tensor -> !torch.tensor | |
%1664 = torch.aten.mm %1663, %arg124 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1665 = torch.aten.t %1664 : !torch.tensor -> !torch.tensor | |
%1666 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%1667 = torch.aten.sum.dim_IntList %1660, %1666, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1668 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%1669 = torch.aten.view %1667, %1668 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1670 = torch.prim.ListConstruct %int4, %int512, %int3072 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1671 = torch.aten.view %1662, %1670 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1672 = torch.aten.t %1665 : !torch.tensor -> !torch.tensor | |
%1673 = torch.aten.gelu_backward %1671, %arg122, %str : !torch.tensor, !torch.tensor, !torch.str -> !torch.tensor | |
%1674 = torch.prim.ListConstruct %int2048, %int3072 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1675 = torch.aten.view %1673, %1674 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1676 = torch.aten.t %arg120 : !torch.tensor -> !torch.tensor | |
%1677 = torch.aten.mm %1675, %1676 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1678 = torch.aten.t %1675 : !torch.tensor -> !torch.tensor | |
%1679 = torch.aten.mm %1678, %arg121 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1680 = torch.aten.t %1679 : !torch.tensor -> !torch.tensor | |
%1681 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%1682 = torch.aten.sum.dim_IntList %1675, %1681, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1683 = torch.prim.ListConstruct %int3072 : (!torch.int) -> !torch.list<int> | |
%1684 = torch.aten.view %1682, %1683 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1685 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1686 = torch.aten.view %1677, %1685 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1687 = torch.aten.add.Tensor %1652, %1686, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1688 = torch.aten.t %1680 : !torch.tensor -> !torch.tensor | |
%1689 = torch.aten.sub.Tensor %arg119, %result1_13, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1690 = torch.aten.mul.Tensor %1689, %result2_14 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1691 = torch.aten.mul.Tensor %1687, %arg20 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1692 = torch.aten.mul.Tensor %1691, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%1693 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%1694 = torch.aten.sum.dim_IntList %1691, %1693, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1695 = torch.aten.mul.Tensor %1691, %1690 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1696 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%1697 = torch.aten.sum.dim_IntList %1695, %1696, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1698 = torch.aten.mul.Tensor %1690, %1697 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1699 = torch.aten.sub.Tensor %1692, %1694, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1700 = torch.aten.sub.Tensor %1699, %1698, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1701 = torch.aten.div.Tensor %result2_14, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%1702 = torch.aten.mul.Tensor %1701, %1700 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1703 = torch.aten.mul.Tensor %1687, %1690 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1704 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1705 = torch.aten.sum.dim_IntList %1703, %1704, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1706 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1707 = torch.aten.sum.dim_IntList %1687, %1706, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1708 = torch.aten.mul.Tensor %1702, %arg118 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1709 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1710 = torch.aten.view %1708, %1709 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1711 = torch.aten.t %arg116 : !torch.tensor -> !torch.tensor | |
%1712 = torch.aten.mm %1710, %1711 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1713 = torch.aten.t %1710 : !torch.tensor -> !torch.tensor | |
%1714 = torch.aten.mm %1713, %arg117 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1715 = torch.aten.t %1714 : !torch.tensor -> !torch.tensor | |
%1716 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%1717 = torch.aten.sum.dim_IntList %1710, %1716, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1718 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%1719 = torch.aten.view %1717, %1718 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1720 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1721 = torch.aten.view %1712, %1720 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1722 = torch.aten.t %1715 : !torch.tensor -> !torch.tensor | |
%1723 = torch.prim.ListConstruct %int4, %int512, %int12, %int64 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1724 = torch.aten.view %1721, %1723 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1725 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1726 = torch.aten.permute %1724, %1725 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1727 = torch.aten.clone %1726, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%1728 = torch.prim.ListConstruct %int48, %int512, %int64 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1729 = torch.aten._unsafe_view %1727, %1728 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1730 = torch.aten.transpose.int %arg114, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%1731 = torch.aten.bmm %1730, %1729 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1732 = torch.aten.transpose.int %arg115, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%1733 = torch.aten.bmm %1729, %1732 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1734 = torch.prim.ListConstruct %int4, %int12, %int512, %int64 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1735 = torch.aten.view %1731, %1734 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1736 = torch.prim.ListConstruct %int4, %int12, %int512, %int512 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1737 = torch.aten.view %1733, %1736 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1738 = torch.aten.mul.Tensor %1737, %arg113 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1739 = torch.aten._softmax_backward_data %1738, %arg112, %int-1, %int6 : !torch.tensor, !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%1740 = torch.aten.div.Tensor %1739, %1 : !torch.tensor, !torch.tensor<[],f64> -> !torch.tensor | |
%1741 = torch.prim.ListConstruct %int48, %int512, %int512 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1742 = torch.aten.view %1740, %1741 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1743 = torch.aten.transpose.int %arg110, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%1744 = torch.aten.bmm %1743, %1742 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1745 = torch.aten.transpose.int %arg111, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%1746 = torch.aten.bmm %1742, %1745 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1747 = torch.prim.ListConstruct %int4, %int12, %int64, %int512 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1748 = torch.aten.view %1744, %1747 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1749 = torch.prim.ListConstruct %int4, %int12, %int512, %int64 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1750 = torch.aten.view %1746, %1749 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1751 = torch.aten.transpose.int %1748, %int-1, %int-2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%1752 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1753 = torch.aten.permute %1750, %1752 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1754 = torch.aten.clone %1753, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%1755 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1756 = torch.aten._unsafe_view %1754, %1755 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1757 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1758 = torch.aten.permute %1735, %1757 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1759 = torch.aten.clone %1758, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%1760 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1761 = torch.aten._unsafe_view %1759, %1760 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1762 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1763 = torch.aten.view %1761, %1762 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1764 = torch.aten.t %arg108 : !torch.tensor -> !torch.tensor | |
%1765 = torch.aten.mm %1763, %1764 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1766 = torch.aten.t %1763 : !torch.tensor -> !torch.tensor | |
%1767 = torch.aten.mm %1766, %arg109 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1768 = torch.aten.t %1767 : !torch.tensor -> !torch.tensor | |
%1769 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%1770 = torch.aten.sum.dim_IntList %1763, %1769, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1771 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%1772 = torch.aten.view %1770, %1771 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1773 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1774 = torch.aten.view %1765, %1773 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1775 = torch.aten.add.Tensor %1702, %1774, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1776 = torch.aten.t %1768 : !torch.tensor -> !torch.tensor | |
%1777 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1778 = torch.aten.permute %1751, %1777 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1779 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1780 = torch.aten.view %1778, %1779 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1781 = torch.aten.clone %1780, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%1782 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1783 = torch.aten._unsafe_view %1781, %1782 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1784 = torch.aten.t %arg106 : !torch.tensor -> !torch.tensor | |
%1785 = torch.aten.mm %1783, %1784 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1786 = torch.aten.t %1783 : !torch.tensor -> !torch.tensor | |
%1787 = torch.aten.mm %1786, %arg107 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1788 = torch.aten.t %1787 : !torch.tensor -> !torch.tensor | |
%1789 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%1790 = torch.aten.sum.dim_IntList %1783, %1789, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1791 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%1792 = torch.aten.view %1790, %1791 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1793 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1794 = torch.aten.view %1785, %1793 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1795 = torch.aten.add.Tensor %1775, %1794, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1796 = torch.aten.t %1788 : !torch.tensor -> !torch.tensor | |
%1797 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1798 = torch.aten.view %1756, %1797 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1799 = torch.aten.t %arg104 : !torch.tensor -> !torch.tensor | |
%1800 = torch.aten.mm %1798, %1799 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1801 = torch.aten.t %1798 : !torch.tensor -> !torch.tensor | |
%1802 = torch.aten.mm %1801, %arg105 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1803 = torch.aten.t %1802 : !torch.tensor -> !torch.tensor | |
%1804 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%1805 = torch.aten.sum.dim_IntList %1798, %1804, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1806 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%1807 = torch.aten.view %1805, %1806 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1808 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1809 = torch.aten.view %1800, %1808 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1810 = torch.aten.add.Tensor %1795, %1809, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1811 = torch.aten.t %1803 : !torch.tensor -> !torch.tensor | |
%1812 = torch.aten.sub.Tensor %arg103, %result1_10, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1813 = torch.aten.mul.Tensor %1812, %result2_11 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1814 = torch.aten.mul.Tensor %1810, %arg10 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1815 = torch.aten.mul.Tensor %1814, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%1816 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%1817 = torch.aten.sum.dim_IntList %1814, %1816, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1818 = torch.aten.mul.Tensor %1814, %1813 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1819 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%1820 = torch.aten.sum.dim_IntList %1818, %1819, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1821 = torch.aten.mul.Tensor %1813, %1820 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1822 = torch.aten.sub.Tensor %1815, %1817, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1823 = torch.aten.sub.Tensor %1822, %1821, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1824 = torch.aten.div.Tensor %result2_11, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%1825 = torch.aten.mul.Tensor %1824, %1823 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1826 = torch.aten.mul.Tensor %1810, %1813 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1827 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1828 = torch.aten.sum.dim_IntList %1826, %1827, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1829 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1830 = torch.aten.sum.dim_IntList %1810, %1829, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1831 = torch.aten.mul.Tensor %1825, %arg102 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1832 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1833 = torch.aten.view %1831, %1832 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1834 = torch.aten.t %arg100 : !torch.tensor -> !torch.tensor | |
%1835 = torch.aten.mm %1833, %1834 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1836 = torch.aten.t %1833 : !torch.tensor -> !torch.tensor | |
%1837 = torch.aten.mm %1836, %arg101 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1838 = torch.aten.t %1837 : !torch.tensor -> !torch.tensor | |
%1839 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%1840 = torch.aten.sum.dim_IntList %1833, %1839, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1841 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%1842 = torch.aten.view %1840, %1841 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1843 = torch.prim.ListConstruct %int4, %int512, %int3072 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1844 = torch.aten.view %1835, %1843 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1845 = torch.aten.t %1838 : !torch.tensor -> !torch.tensor | |
%1846 = torch.aten.gelu_backward %1844, %arg99, %str : !torch.tensor, !torch.tensor, !torch.str -> !torch.tensor | |
%1847 = torch.prim.ListConstruct %int2048, %int3072 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1848 = torch.aten.view %1846, %1847 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1849 = torch.aten.t %arg97 : !torch.tensor -> !torch.tensor | |
%1850 = torch.aten.mm %1848, %1849 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1851 = torch.aten.t %1848 : !torch.tensor -> !torch.tensor | |
%1852 = torch.aten.mm %1851, %arg98 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1853 = torch.aten.t %1852 : !torch.tensor -> !torch.tensor | |
%1854 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%1855 = torch.aten.sum.dim_IntList %1848, %1854, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1856 = torch.prim.ListConstruct %int3072 : (!torch.int) -> !torch.list<int> | |
%1857 = torch.aten.view %1855, %1856 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1858 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1859 = torch.aten.view %1850, %1858 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1860 = torch.aten.add.Tensor %1825, %1859, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1861 = torch.aten.t %1853 : !torch.tensor -> !torch.tensor | |
%1862 = torch.aten.sub.Tensor %arg96, %result1_7, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1863 = torch.aten.mul.Tensor %1862, %result2_8 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1864 = torch.aten.mul.Tensor %1860, %arg8 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1865 = torch.aten.mul.Tensor %1864, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%1866 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%1867 = torch.aten.sum.dim_IntList %1864, %1866, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1868 = torch.aten.mul.Tensor %1864, %1863 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1869 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%1870 = torch.aten.sum.dim_IntList %1868, %1869, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1871 = torch.aten.mul.Tensor %1863, %1870 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1872 = torch.aten.sub.Tensor %1865, %1867, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1873 = torch.aten.sub.Tensor %1872, %1871, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1874 = torch.aten.div.Tensor %result2_8, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%1875 = torch.aten.mul.Tensor %1874, %1873 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1876 = torch.aten.mul.Tensor %1860, %1863 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1877 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1878 = torch.aten.sum.dim_IntList %1876, %1877, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1879 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1880 = torch.aten.sum.dim_IntList %1860, %1879, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1881 = torch.aten.mul.Tensor %1875, %arg95 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1882 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1883 = torch.aten.view %1881, %1882 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1884 = torch.aten.t %arg93 : !torch.tensor -> !torch.tensor | |
%1885 = torch.aten.mm %1883, %1884 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1886 = torch.aten.t %1883 : !torch.tensor -> !torch.tensor | |
%1887 = torch.aten.mm %1886, %arg94 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1888 = torch.aten.t %1887 : !torch.tensor -> !torch.tensor | |
%1889 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%1890 = torch.aten.sum.dim_IntList %1883, %1889, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1891 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%1892 = torch.aten.view %1890, %1891 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1893 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1894 = torch.aten.view %1885, %1893 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1895 = torch.aten.t %1888 : !torch.tensor -> !torch.tensor | |
%1896 = torch.prim.ListConstruct %int4, %int512, %int12, %int64 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1897 = torch.aten.view %1894, %1896 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1898 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1899 = torch.aten.permute %1897, %1898 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1900 = torch.aten.clone %1899, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%1901 = torch.prim.ListConstruct %int48, %int512, %int64 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1902 = torch.aten._unsafe_view %1900, %1901 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1903 = torch.aten.transpose.int %arg91, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%1904 = torch.aten.bmm %1903, %1902 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1905 = torch.aten.transpose.int %arg92, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%1906 = torch.aten.bmm %1902, %1905 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1907 = torch.prim.ListConstruct %int4, %int12, %int512, %int64 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1908 = torch.aten.view %1904, %1907 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1909 = torch.prim.ListConstruct %int4, %int12, %int512, %int512 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1910 = torch.aten.view %1906, %1909 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1911 = torch.aten.mul.Tensor %1910, %arg90 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1912 = torch.aten._softmax_backward_data %1911, %arg89, %int-1, %int6 : !torch.tensor, !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%1913 = torch.aten.div.Tensor %1912, %1 : !torch.tensor, !torch.tensor<[],f64> -> !torch.tensor | |
%1914 = torch.prim.ListConstruct %int48, %int512, %int512 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1915 = torch.aten.view %1913, %1914 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1916 = torch.aten.transpose.int %arg87, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%1917 = torch.aten.bmm %1916, %1915 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1918 = torch.aten.transpose.int %arg88, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%1919 = torch.aten.bmm %1915, %1918 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1920 = torch.prim.ListConstruct %int4, %int12, %int64, %int512 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1921 = torch.aten.view %1917, %1920 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1922 = torch.prim.ListConstruct %int4, %int12, %int512, %int64 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1923 = torch.aten.view %1919, %1922 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1924 = torch.aten.transpose.int %1921, %int-1, %int-2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%1925 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1926 = torch.aten.permute %1923, %1925 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1927 = torch.aten.clone %1926, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%1928 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1929 = torch.aten._unsafe_view %1927, %1928 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1930 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1931 = torch.aten.permute %1908, %1930 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1932 = torch.aten.clone %1931, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%1933 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1934 = torch.aten._unsafe_view %1932, %1933 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1935 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1936 = torch.aten.view %1934, %1935 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1937 = torch.aten.t %arg85 : !torch.tensor -> !torch.tensor | |
%1938 = torch.aten.mm %1936, %1937 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1939 = torch.aten.t %1936 : !torch.tensor -> !torch.tensor | |
%1940 = torch.aten.mm %1939, %arg86 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1941 = torch.aten.t %1940 : !torch.tensor -> !torch.tensor | |
%1942 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%1943 = torch.aten.sum.dim_IntList %1936, %1942, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1944 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%1945 = torch.aten.view %1943, %1944 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1946 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1947 = torch.aten.view %1938, %1946 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1948 = torch.aten.add.Tensor %1875, %1947, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1949 = torch.aten.t %1941 : !torch.tensor -> !torch.tensor | |
%1950 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1951 = torch.aten.permute %1924, %1950 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1952 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1953 = torch.aten.view %1951, %1952 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1954 = torch.aten.clone %1953, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%1955 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1956 = torch.aten._unsafe_view %1954, %1955 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1957 = torch.aten.t %arg83 : !torch.tensor -> !torch.tensor | |
%1958 = torch.aten.mm %1956, %1957 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1959 = torch.aten.t %1956 : !torch.tensor -> !torch.tensor | |
%1960 = torch.aten.mm %1959, %arg84 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1961 = torch.aten.t %1960 : !torch.tensor -> !torch.tensor | |
%1962 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%1963 = torch.aten.sum.dim_IntList %1956, %1962, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1964 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%1965 = torch.aten.view %1963, %1964 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1966 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1967 = torch.aten.view %1958, %1966 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1968 = torch.aten.add.Tensor %1948, %1967, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1969 = torch.aten.t %1961 : !torch.tensor -> !torch.tensor | |
%1970 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%1971 = torch.aten.view %1929, %1970 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1972 = torch.aten.t %arg81 : !torch.tensor -> !torch.tensor | |
%1973 = torch.aten.mm %1971, %1972 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1974 = torch.aten.t %1971 : !torch.tensor -> !torch.tensor | |
%1975 = torch.aten.mm %1974, %arg82 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1976 = torch.aten.t %1975 : !torch.tensor -> !torch.tensor | |
%1977 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%1978 = torch.aten.sum.dim_IntList %1971, %1977, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1979 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%1980 = torch.aten.view %1978, %1979 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1981 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%1982 = torch.aten.view %1973, %1981 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%1983 = torch.aten.add.Tensor %1968, %1982, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1984 = torch.aten.t %1976 : !torch.tensor -> !torch.tensor | |
%1985 = torch.aten.sub.Tensor %arg80, %result1_4, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1986 = torch.aten.mul.Tensor %1985, %result2_5 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1987 = torch.aten.mul.Tensor %1983, %arg6 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1988 = torch.aten.mul.Tensor %1987, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%1989 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%1990 = torch.aten.sum.dim_IntList %1987, %1989, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1991 = torch.aten.mul.Tensor %1987, %1986 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1992 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%1993 = torch.aten.sum.dim_IntList %1991, %1992, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%1994 = torch.aten.mul.Tensor %1986, %1993 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1995 = torch.aten.sub.Tensor %1988, %1990, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1996 = torch.aten.sub.Tensor %1995, %1994, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%1997 = torch.aten.div.Tensor %result2_5, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%1998 = torch.aten.mul.Tensor %1997, %1996 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%1999 = torch.aten.mul.Tensor %1983, %1986 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%2000 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%2001 = torch.aten.sum.dim_IntList %1999, %2000, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%2002 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%2003 = torch.aten.sum.dim_IntList %1983, %2002, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%2004 = torch.aten.mul.Tensor %1998, %arg79 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%2005 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%2006 = torch.aten.view %2004, %2005 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%2007 = torch.aten.t %arg77 : !torch.tensor -> !torch.tensor | |
%2008 = torch.aten.mm %2006, %2007 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%2009 = torch.aten.t %2006 : !torch.tensor -> !torch.tensor | |
%2010 = torch.aten.mm %2009, %arg78 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%2011 = torch.aten.t %2010 : !torch.tensor -> !torch.tensor | |
%2012 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%2013 = torch.aten.sum.dim_IntList %2006, %2012, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%2014 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%2015 = torch.aten.view %2013, %2014 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%2016 = torch.prim.ListConstruct %int4, %int512, %int3072 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%2017 = torch.aten.view %2008, %2016 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%2018 = torch.aten.t %2011 : !torch.tensor -> !torch.tensor | |
%2019 = torch.aten.gelu_backward %2017, %arg76, %str : !torch.tensor, !torch.tensor, !torch.str -> !torch.tensor | |
%2020 = torch.prim.ListConstruct %int2048, %int3072 : (!torch.int, !torch.int) -> !torch.list<int> | |
%2021 = torch.aten.view %2019, %2020 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%2022 = torch.aten.t %arg74 : !torch.tensor -> !torch.tensor | |
%2023 = torch.aten.mm %2021, %2022 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%2024 = torch.aten.t %2021 : !torch.tensor -> !torch.tensor | |
%2025 = torch.aten.mm %2024, %arg75 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%2026 = torch.aten.t %2025 : !torch.tensor -> !torch.tensor | |
%2027 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%2028 = torch.aten.sum.dim_IntList %2021, %2027, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%2029 = torch.prim.ListConstruct %int3072 : (!torch.int) -> !torch.list<int> | |
%2030 = torch.aten.view %2028, %2029 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%2031 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%2032 = torch.aten.view %2023, %2031 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%2033 = torch.aten.add.Tensor %1998, %2032, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%2034 = torch.aten.t %2026 : !torch.tensor -> !torch.tensor | |
%2035 = torch.aten.sub.Tensor %arg73, %result1_1, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%2036 = torch.aten.mul.Tensor %2035, %result2_2 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%2037 = torch.aten.mul.Tensor %2033, %arg4 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%2038 = torch.aten.mul.Tensor %2037, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%2039 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%2040 = torch.aten.sum.dim_IntList %2037, %2039, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%2041 = torch.aten.mul.Tensor %2037, %2036 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%2042 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%2043 = torch.aten.sum.dim_IntList %2041, %2042, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%2044 = torch.aten.mul.Tensor %2036, %2043 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%2045 = torch.aten.sub.Tensor %2038, %2040, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%2046 = torch.aten.sub.Tensor %2045, %2044, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%2047 = torch.aten.div.Tensor %result2_2, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%2048 = torch.aten.mul.Tensor %2047, %2046 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%2049 = torch.aten.mul.Tensor %2033, %2036 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%2050 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%2051 = torch.aten.sum.dim_IntList %2049, %2050, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%2052 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%2053 = torch.aten.sum.dim_IntList %2033, %2052, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%2054 = torch.aten.mul.Tensor %2048, %arg72 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%2055 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%2056 = torch.aten.view %2054, %2055 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%2057 = torch.aten.t %arg70 : !torch.tensor -> !torch.tensor | |
%2058 = torch.aten.mm %2056, %2057 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%2059 = torch.aten.t %2056 : !torch.tensor -> !torch.tensor | |
%2060 = torch.aten.mm %2059, %arg71 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%2061 = torch.aten.t %2060 : !torch.tensor -> !torch.tensor | |
%2062 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%2063 = torch.aten.sum.dim_IntList %2056, %2062, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%2064 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%2065 = torch.aten.view %2063, %2064 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%2066 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%2067 = torch.aten.view %2058, %2066 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%2068 = torch.aten.t %2061 : !torch.tensor -> !torch.tensor | |
%2069 = torch.prim.ListConstruct %int4, %int512, %int12, %int64 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%2070 = torch.aten.view %2067, %2069 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%2071 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%2072 = torch.aten.permute %2070, %2071 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%2073 = torch.aten.clone %2072, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%2074 = torch.prim.ListConstruct %int48, %int512, %int64 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%2075 = torch.aten._unsafe_view %2073, %2074 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%2076 = torch.aten.transpose.int %arg68, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%2077 = torch.aten.bmm %2076, %2075 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%2078 = torch.aten.transpose.int %arg69, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%2079 = torch.aten.bmm %2075, %2078 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%2080 = torch.prim.ListConstruct %int4, %int12, %int512, %int64 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%2081 = torch.aten.view %2077, %2080 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%2082 = torch.prim.ListConstruct %int4, %int12, %int512, %int512 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%2083 = torch.aten.view %2079, %2082 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%2084 = torch.aten.mul.Tensor %2083, %arg67 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%2085 = torch.aten._softmax_backward_data %2084, %arg66, %int-1, %int6 : !torch.tensor, !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%2086 = torch.aten.div.Tensor %2085, %1 : !torch.tensor, !torch.tensor<[],f64> -> !torch.tensor | |
%2087 = torch.prim.ListConstruct %int48, %int512, %int512 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%2088 = torch.aten.view %2086, %2087 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%2089 = torch.aten.transpose.int %arg64, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%2090 = torch.aten.bmm %2089, %2088 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%2091 = torch.aten.transpose.int %arg65, %int1, %int2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%2092 = torch.aten.bmm %2088, %2091 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%2093 = torch.prim.ListConstruct %int4, %int12, %int64, %int512 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%2094 = torch.aten.view %2090, %2093 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%2095 = torch.prim.ListConstruct %int4, %int12, %int512, %int64 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%2096 = torch.aten.view %2092, %2095 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%2097 = torch.aten.transpose.int %2094, %int-1, %int-2 : !torch.tensor, !torch.int, !torch.int -> !torch.tensor | |
%2098 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%2099 = torch.aten.permute %2096, %2098 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%2100 = torch.aten.clone %2099, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%2101 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%2102 = torch.aten._unsafe_view %2100, %2101 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%2103 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%2104 = torch.aten.permute %2081, %2103 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%2105 = torch.aten.clone %2104, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%2106 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%2107 = torch.aten._unsafe_view %2105, %2106 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%2108 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%2109 = torch.aten.view %2107, %2108 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%2110 = torch.aten.t %arg62 : !torch.tensor -> !torch.tensor | |
%2111 = torch.aten.mm %2109, %2110 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%2112 = torch.aten.t %2109 : !torch.tensor -> !torch.tensor | |
%2113 = torch.aten.mm %2112, %arg63 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%2114 = torch.aten.t %2113 : !torch.tensor -> !torch.tensor | |
%2115 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%2116 = torch.aten.sum.dim_IntList %2109, %2115, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%2117 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%2118 = torch.aten.view %2116, %2117 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%2119 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%2120 = torch.aten.view %2111, %2119 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%2121 = torch.aten.add.Tensor %2048, %2120, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%2122 = torch.aten.t %2114 : !torch.tensor -> !torch.tensor | |
%2123 = torch.prim.ListConstruct %int0, %int2, %int1, %int3 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%2124 = torch.aten.permute %2097, %2123 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%2125 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%2126 = torch.aten.view %2124, %2125 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%2127 = torch.aten.clone %2126, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%2128 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%2129 = torch.aten._unsafe_view %2127, %2128 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%2130 = torch.aten.t %arg60 : !torch.tensor -> !torch.tensor | |
%2131 = torch.aten.mm %2129, %2130 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%2132 = torch.aten.t %2129 : !torch.tensor -> !torch.tensor | |
%2133 = torch.aten.mm %2132, %arg61 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%2134 = torch.aten.t %2133 : !torch.tensor -> !torch.tensor | |
%2135 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%2136 = torch.aten.sum.dim_IntList %2129, %2135, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%2137 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%2138 = torch.aten.view %2136, %2137 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%2139 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%2140 = torch.aten.view %2131, %2139 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%2141 = torch.aten.add.Tensor %2121, %2140, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%2142 = torch.aten.t %2134 : !torch.tensor -> !torch.tensor | |
%2143 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%2144 = torch.aten.view %2102, %2143 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%2145 = torch.aten.t %arg58 : !torch.tensor -> !torch.tensor | |
%2146 = torch.aten.mm %2144, %2145 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%2147 = torch.aten.t %2144 : !torch.tensor -> !torch.tensor | |
%2148 = torch.aten.mm %2147, %arg59 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%2149 = torch.aten.t %2148 : !torch.tensor -> !torch.tensor | |
%2150 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%2151 = torch.aten.sum.dim_IntList %2144, %2150, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%2152 = torch.prim.ListConstruct %int768 : (!torch.int) -> !torch.list<int> | |
%2153 = torch.aten.view %2151, %2152 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%2154 = torch.prim.ListConstruct %int4, %int512, %int768 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int> | |
%2155 = torch.aten.view %2146, %2154 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%2156 = torch.aten.add.Tensor %2141, %2155, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%2157 = torch.aten.t %2149 : !torch.tensor -> !torch.tensor | |
%2158 = torch.aten.mul.Tensor %2156, %arg57 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%2159 = torch.aten.sub.Tensor %arg56, %result1, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%2160 = torch.aten.mul.Tensor %2159, %result2 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%2161 = torch.aten.mul.Tensor %2158, %arg2 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%2162 = torch.aten.mul.Tensor %2161, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%2163 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%2164 = torch.aten.sum.dim_IntList %2161, %2163, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%2165 = torch.aten.mul.Tensor %2161, %2160 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%2166 = torch.prim.ListConstruct %int2 : (!torch.int) -> !torch.list<int> | |
%2167 = torch.aten.sum.dim_IntList %2165, %2166, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%2168 = torch.aten.mul.Tensor %2160, %2167 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%2169 = torch.aten.sub.Tensor %2162, %2164, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%2170 = torch.aten.sub.Tensor %2169, %2168, %int1 : !torch.tensor, !torch.tensor, !torch.int -> !torch.tensor | |
%2171 = torch.aten.div.Tensor %result2, %2 : !torch.tensor, !torch.tensor<[],si64> -> !torch.tensor | |
%2172 = torch.aten.mul.Tensor %2171, %2170 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%2173 = torch.aten.mul.Tensor %2158, %2160 : !torch.tensor, !torch.tensor -> !torch.tensor | |
%2174 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%2175 = torch.aten.sum.dim_IntList %2173, %2174, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%2176 = torch.prim.ListConstruct %int0, %int1 : (!torch.int, !torch.int) -> !torch.list<int> | |
%2177 = torch.aten.sum.dim_IntList %2158, %2176, %false, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%2178 = torch.prim.ListConstruct %int0 : (!torch.int) -> !torch.list<int> | |
%2179 = torch.aten.sum.dim_IntList %2172, %2178, %true, %none : !torch.tensor, !torch.list<int>, !torch.bool, !torch.none -> !torch.tensor | |
%2180 = torch.prim.ListConstruct %int512, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%2181 = torch.aten.view %2179, %2180 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%2182 = torch.prim.ListConstruct %int512, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%2183 = torch.aten.new_empty %2179, %2182, %int6, %int0, %cpu, %false : !torch.tensor, !torch.list<int>, !torch.int, !torch.int, !torch.Device, !torch.bool -> !torch.tensor | |
%2184 = torch.aten.zero_ %2183 : !torch.tensor -> !torch.tensor | |
%2185 = torch.prim.ListConstruct %int512 : (!torch.int) -> !torch.list<int> | |
%2186 = torch.aten.view %arg55, %2185 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%2187 = torch.aten.ne.Scalar %2186, %int-1 : !torch.tensor, !torch.int -> !torch.tensor | |
%2188 = torch.aten.unsqueeze %2187, %int1 : !torch.tensor, !torch.int -> !torch.tensor | |
%2189 = torch.prim.ListConstruct %int512, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%2190 = torch.aten.expand %2188, %2189, %false : !torch.tensor, !torch.list<int>, !torch.bool -> !torch.tensor | |
%2191 = torch.aten.full_like %2181, %int0, %int6, %int0, %cpu, %false, %none : !torch.tensor, !torch.int, !torch.int, !torch.int, !torch.Device, !torch.bool, !torch.none -> !torch.tensor | |
%2192 = torch.aten.where.self %2190, %2181, %2191 : !torch.tensor, !torch.tensor, !torch.tensor -> !torch.tensor | |
%2193 = torch.prim.ListConstruct %2186 : (!torch.tensor) -> !torch.list<tensor> | |
%2194 = torch.operator "aten.index_put.hacked_twin"(%2184, %2193, %2192, %true) : (!torch.tensor, !torch.list<tensor>, !torch.tensor, !torch.bool) -> !torch.tensor | |
%2195 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%2196 = torch.aten.view %2172, %2195 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%2197 = torch.prim.ListConstruct %int2, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%2198 = torch.aten.new_empty %2172, %2197, %int6, %int0, %cpu, %false : !torch.tensor, !torch.list<int>, !torch.int, !torch.int, !torch.Device, !torch.bool -> !torch.tensor | |
%2199 = torch.aten.zero_ %2198 : !torch.tensor -> !torch.tensor | |
%2200 = torch.aten.clone %arg54, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%2201 = torch.prim.ListConstruct %int2048 : (!torch.int) -> !torch.list<int> | |
%2202 = torch.aten._unsafe_view %2200, %2201 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%2203 = torch.aten.ne.Scalar %2202, %int-1 : !torch.tensor, !torch.int -> !torch.tensor | |
%2204 = torch.aten.unsqueeze %2203, %int1 : !torch.tensor, !torch.int -> !torch.tensor | |
%2205 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%2206 = torch.aten.expand %2204, %2205, %false : !torch.tensor, !torch.list<int>, !torch.bool -> !torch.tensor | |
%2207 = torch.aten.full_like %2196, %int0, %int6, %int0, %cpu, %false, %none : !torch.tensor, !torch.int, !torch.int, !torch.int, !torch.Device, !torch.bool, !torch.none -> !torch.tensor | |
%2208 = torch.aten.where.self %2206, %2196, %2207 : !torch.tensor, !torch.tensor, !torch.tensor -> !torch.tensor | |
%2209 = torch.prim.ListConstruct %2202 : (!torch.tensor) -> !torch.list<tensor> | |
%2210 = torch.operator "aten.index_put.hacked_twin"(%2199, %2209, %2208, %true) : (!torch.tensor, !torch.list<tensor>, !torch.tensor, !torch.bool) -> !torch.tensor | |
%2211 = torch.prim.ListConstruct %int30522, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%2212 = torch.aten.new_empty %2172, %2211, %int6, %int0, %cpu, %false : !torch.tensor, !torch.list<int>, !torch.int, !torch.int, !torch.Device, !torch.bool -> !torch.tensor | |
%2213 = torch.aten.zero_ %2212 : !torch.tensor -> !torch.tensor | |
%2214 = torch.prim.ListConstruct %int2048 : (!torch.int) -> !torch.list<int> | |
%2215 = torch.aten.view %arg53, %2214 : !torch.tensor, !torch.list<int> -> !torch.tensor | |
%2216 = torch.aten.ne.Scalar %2215, %int0 : !torch.tensor, !torch.int -> !torch.tensor | |
%2217 = torch.aten.unsqueeze %2216, %int1 : !torch.tensor, !torch.int -> !torch.tensor | |
%2218 = torch.prim.ListConstruct %int2048, %int768 : (!torch.int, !torch.int) -> !torch.list<int> | |
%2219 = torch.aten.expand %2217, %2218, %false : !torch.tensor, !torch.list<int>, !torch.bool -> !torch.tensor | |
%2220 = torch.aten.where.self %2219, %2196, %2207 : !torch.tensor, !torch.tensor, !torch.tensor -> !torch.tensor | |
%2221 = torch.prim.ListConstruct %2215 : (!torch.tensor) -> !torch.list<tensor> | |
%2222 = torch.aten.where.self %2219, %2196, %2207 : !torch.tensor, !torch.tensor, !torch.tensor -> !torch.tensor | |
%2223 = torch.prim.TupleConstruct %2177, %2175, %2194, %2210, %2222, %2053, %2051, %2065, %2068, %2138, %2142, %2153, %2157, %2118, %2122, %2030, %2034, %2003, %2001, %2015, %2018, %1880, %1878, %1892, %1895, %1965, %1969, %1980, %1984, %1945, %1949, %1857, %1861, %1830, %1828, %1842, %1845, %323, %321, %335, %338, %408, %412, %423, %427, %388, %392, %300, %304, %273, %271, %285, %288, %150, %148, %162, %165, %235, %239, %250, %254, %215, %219, %127, %131, %100, %98, %112, %115, %1707, %1705, %1719, %1722, %1792, %1796, %1807, %1811, %1772, %1776, %1684, %1688, %1657, %1655, %1669, %1672, %1534, %1532, %1546, %1549, %1619, %1623, %1634, %1638, %1599, %1603, %1511, %1515, %1484, %1482, %1496, %1499, %1361, %1359, %1373, %1376, %1446, %1450, %1461, %1465, %1426, %1430, %1338, %1342, %1311, %1309, %1323, %1326, %1188, %1186, %1200, %1203, %1273, %1277, %1288, %1292, %1253, %1257, %1165, %1169, %1138, %1136, %1150, %1153, %1015, %1013, %1027, %1030, %1100, %1104, %1115, %1119, %1080, %1084, %992, %996, %965, %963, %977, %980, %842, %840, %854, %857, %927, %931, %942, %946, %907, %911, %819, %823, %792, %790, %804, %807, %669, %667, %681, %684, %754, %758, %769, %773, %734, %738, %646, %650, %619, %617, %631, %634, %496, %494, %508, %511, %581, %585, %596, %600, %561, %565, %473, %477, %446, %444, %458, %461, %non, %44, %47, %66, %64, %78, %81, %81, %81, %81, %81 : !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, 
!torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, 
!torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor, !torch.tensor -> !torch.tuple<tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, 
tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor> | |
return %2223 : !torch.tuple<tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor, tensor> | |
} | |
// Class type declaration for the symbol
// @__torch__.torch.fx.graph_module.___torch_mangle_2.GraphModule.
// It lists a single method entry: the name "forward" is bound to the function
// symbol @__torch__.torch.fx.graph_module.___torch_mangle_2.GraphModule.forward
// (the private func defined earlier in this module).
// No other members are declared in this class type.
torch.class_type @__torch__.torch.fx.graph_module.___torch_mangle_2.GraphModule { | |
torch.method "forward", @__torch__.torch.fx.graph_module.___torch_mangle_2.GraphModule.forward | |
} | |
// Module instance %0, typed as
// !torch.nn.Module<"__torch__.torch.fx.graph_module.___torch_mangle_2.GraphModule">.
// The region between the braces is empty, so nothing is initialized on the
// instance here.
// NOTE(review): presumably the tensors this module needs are supplied through
// the forward function's !torch.tensor arguments (%arg1, %arg2, ...) rather
// than stored on the instance; confirm against the producer of this IR.
%0 = torch.nn_module { | |
} : !torch.nn.Module<"__torch__.torch.fx.graph_module.___torch_mangle_2.GraphModule"> | |
} |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment