// Affine-map aliases over a 3-d iteration space:
//   #map  keeps (d1, d2) and drops d0;
//   #map1 is the identity on (d0, d1, d2).
#map = affine_map<(d0, d1, d2) -> (d1, d2)>
#map1 = affine_map<(d0, d1, d2) -> (d0, d1, d2)>

module @module {
  // Module-level private globals, one declaration per line.
  //
  // The first global is initialised from a `dense_resource` blob. Every other
  // global in this run is initialised from a `#stream.parameter.named`
  // attribute written as "model"::"<name>", where <name> is the global's
  // symbol name without the `__auto.` prefix.
  //
  // NOTE(review): `complex` below carries no element type, although the symbol
  // name says complex64. The same spelling is used where this global is loaded
  // in @decode_bs4. Presumably an element type such as `<f32>` was lost in a
  // text-processing step -- confirm against the exporter's original output.
  util.global private @__auto.constant_2048_50_torch.complex64 = dense_resource<__auto.constant_2048_50_torch.complex64> : tensor<2048x50xcomplex>
  util.global private @__auto.token_embd.weight = #stream.parameter.named<"model"::"token_embd.weight"> : tensor<32000x3200xf16>

  // Per-block parameters, blk.0 .. blk.25. Each block declares the same nine
  // globals with the same types:
  //   attn_norm, ffn_norm                   : tensor<3200xf32>
  //   attn_q, attn_k, attn_v, attn_output   : tensor<3200x3200xf16>
  //   ffn_gate, ffn_up                      : tensor<8640x3200xf16>
  //   ffn_down                              : tensor<3200x8640xf16>

  // blk.0
  util.global private @__auto.blk.0.attn_norm.weight = #stream.parameter.named<"model"::"blk.0.attn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.0.attn_q.weight = #stream.parameter.named<"model"::"blk.0.attn_q.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.0.attn_k.weight = #stream.parameter.named<"model"::"blk.0.attn_k.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.0.attn_v.weight = #stream.parameter.named<"model"::"blk.0.attn_v.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.0.attn_output.weight = #stream.parameter.named<"model"::"blk.0.attn_output.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.0.ffn_norm.weight = #stream.parameter.named<"model"::"blk.0.ffn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.0.ffn_gate.weight = #stream.parameter.named<"model"::"blk.0.ffn_gate.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.0.ffn_up.weight = #stream.parameter.named<"model"::"blk.0.ffn_up.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.0.ffn_down.weight = #stream.parameter.named<"model"::"blk.0.ffn_down.weight"> : tensor<3200x8640xf16>

  // blk.1
  util.global private @__auto.blk.1.attn_norm.weight = #stream.parameter.named<"model"::"blk.1.attn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.1.attn_q.weight = #stream.parameter.named<"model"::"blk.1.attn_q.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.1.attn_k.weight = #stream.parameter.named<"model"::"blk.1.attn_k.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.1.attn_v.weight = #stream.parameter.named<"model"::"blk.1.attn_v.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.1.attn_output.weight = #stream.parameter.named<"model"::"blk.1.attn_output.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.1.ffn_norm.weight = #stream.parameter.named<"model"::"blk.1.ffn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.1.ffn_gate.weight = #stream.parameter.named<"model"::"blk.1.ffn_gate.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.1.ffn_up.weight = #stream.parameter.named<"model"::"blk.1.ffn_up.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.1.ffn_down.weight = #stream.parameter.named<"model"::"blk.1.ffn_down.weight"> : tensor<3200x8640xf16>

  // blk.2
  util.global private @__auto.blk.2.attn_norm.weight = #stream.parameter.named<"model"::"blk.2.attn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.2.attn_q.weight = #stream.parameter.named<"model"::"blk.2.attn_q.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.2.attn_k.weight = #stream.parameter.named<"model"::"blk.2.attn_k.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.2.attn_v.weight = #stream.parameter.named<"model"::"blk.2.attn_v.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.2.attn_output.weight = #stream.parameter.named<"model"::"blk.2.attn_output.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.2.ffn_norm.weight = #stream.parameter.named<"model"::"blk.2.ffn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.2.ffn_gate.weight = #stream.parameter.named<"model"::"blk.2.ffn_gate.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.2.ffn_up.weight = #stream.parameter.named<"model"::"blk.2.ffn_up.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.2.ffn_down.weight = #stream.parameter.named<"model"::"blk.2.ffn_down.weight"> : tensor<3200x8640xf16>

  // blk.3
  util.global private @__auto.blk.3.attn_norm.weight = #stream.parameter.named<"model"::"blk.3.attn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.3.attn_q.weight = #stream.parameter.named<"model"::"blk.3.attn_q.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.3.attn_k.weight = #stream.parameter.named<"model"::"blk.3.attn_k.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.3.attn_v.weight = #stream.parameter.named<"model"::"blk.3.attn_v.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.3.attn_output.weight = #stream.parameter.named<"model"::"blk.3.attn_output.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.3.ffn_norm.weight = #stream.parameter.named<"model"::"blk.3.ffn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.3.ffn_gate.weight = #stream.parameter.named<"model"::"blk.3.ffn_gate.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.3.ffn_up.weight = #stream.parameter.named<"model"::"blk.3.ffn_up.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.3.ffn_down.weight = #stream.parameter.named<"model"::"blk.3.ffn_down.weight"> : tensor<3200x8640xf16>

  // blk.4
  util.global private @__auto.blk.4.attn_norm.weight = #stream.parameter.named<"model"::"blk.4.attn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.4.attn_q.weight = #stream.parameter.named<"model"::"blk.4.attn_q.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.4.attn_k.weight = #stream.parameter.named<"model"::"blk.4.attn_k.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.4.attn_v.weight = #stream.parameter.named<"model"::"blk.4.attn_v.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.4.attn_output.weight = #stream.parameter.named<"model"::"blk.4.attn_output.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.4.ffn_norm.weight = #stream.parameter.named<"model"::"blk.4.ffn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.4.ffn_gate.weight = #stream.parameter.named<"model"::"blk.4.ffn_gate.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.4.ffn_up.weight = #stream.parameter.named<"model"::"blk.4.ffn_up.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.4.ffn_down.weight = #stream.parameter.named<"model"::"blk.4.ffn_down.weight"> : tensor<3200x8640xf16>

  // blk.5
  util.global private @__auto.blk.5.attn_norm.weight = #stream.parameter.named<"model"::"blk.5.attn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.5.attn_q.weight = #stream.parameter.named<"model"::"blk.5.attn_q.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.5.attn_k.weight = #stream.parameter.named<"model"::"blk.5.attn_k.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.5.attn_v.weight = #stream.parameter.named<"model"::"blk.5.attn_v.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.5.attn_output.weight = #stream.parameter.named<"model"::"blk.5.attn_output.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.5.ffn_norm.weight = #stream.parameter.named<"model"::"blk.5.ffn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.5.ffn_gate.weight = #stream.parameter.named<"model"::"blk.5.ffn_gate.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.5.ffn_up.weight = #stream.parameter.named<"model"::"blk.5.ffn_up.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.5.ffn_down.weight = #stream.parameter.named<"model"::"blk.5.ffn_down.weight"> : tensor<3200x8640xf16>

  // blk.6
  util.global private @__auto.blk.6.attn_norm.weight = #stream.parameter.named<"model"::"blk.6.attn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.6.attn_q.weight = #stream.parameter.named<"model"::"blk.6.attn_q.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.6.attn_k.weight = #stream.parameter.named<"model"::"blk.6.attn_k.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.6.attn_v.weight = #stream.parameter.named<"model"::"blk.6.attn_v.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.6.attn_output.weight = #stream.parameter.named<"model"::"blk.6.attn_output.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.6.ffn_norm.weight = #stream.parameter.named<"model"::"blk.6.ffn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.6.ffn_gate.weight = #stream.parameter.named<"model"::"blk.6.ffn_gate.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.6.ffn_up.weight = #stream.parameter.named<"model"::"blk.6.ffn_up.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.6.ffn_down.weight = #stream.parameter.named<"model"::"blk.6.ffn_down.weight"> : tensor<3200x8640xf16>

  // blk.7
  util.global private @__auto.blk.7.attn_norm.weight = #stream.parameter.named<"model"::"blk.7.attn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.7.attn_q.weight = #stream.parameter.named<"model"::"blk.7.attn_q.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.7.attn_k.weight = #stream.parameter.named<"model"::"blk.7.attn_k.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.7.attn_v.weight = #stream.parameter.named<"model"::"blk.7.attn_v.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.7.attn_output.weight = #stream.parameter.named<"model"::"blk.7.attn_output.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.7.ffn_norm.weight = #stream.parameter.named<"model"::"blk.7.ffn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.7.ffn_gate.weight = #stream.parameter.named<"model"::"blk.7.ffn_gate.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.7.ffn_up.weight = #stream.parameter.named<"model"::"blk.7.ffn_up.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.7.ffn_down.weight = #stream.parameter.named<"model"::"blk.7.ffn_down.weight"> : tensor<3200x8640xf16>

  // blk.8
  util.global private @__auto.blk.8.attn_norm.weight = #stream.parameter.named<"model"::"blk.8.attn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.8.attn_q.weight = #stream.parameter.named<"model"::"blk.8.attn_q.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.8.attn_k.weight = #stream.parameter.named<"model"::"blk.8.attn_k.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.8.attn_v.weight = #stream.parameter.named<"model"::"blk.8.attn_v.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.8.attn_output.weight = #stream.parameter.named<"model"::"blk.8.attn_output.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.8.ffn_norm.weight = #stream.parameter.named<"model"::"blk.8.ffn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.8.ffn_gate.weight = #stream.parameter.named<"model"::"blk.8.ffn_gate.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.8.ffn_up.weight = #stream.parameter.named<"model"::"blk.8.ffn_up.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.8.ffn_down.weight = #stream.parameter.named<"model"::"blk.8.ffn_down.weight"> : tensor<3200x8640xf16>

  // blk.9
  util.global private @__auto.blk.9.attn_norm.weight = #stream.parameter.named<"model"::"blk.9.attn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.9.attn_q.weight = #stream.parameter.named<"model"::"blk.9.attn_q.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.9.attn_k.weight = #stream.parameter.named<"model"::"blk.9.attn_k.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.9.attn_v.weight = #stream.parameter.named<"model"::"blk.9.attn_v.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.9.attn_output.weight = #stream.parameter.named<"model"::"blk.9.attn_output.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.9.ffn_norm.weight = #stream.parameter.named<"model"::"blk.9.ffn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.9.ffn_gate.weight = #stream.parameter.named<"model"::"blk.9.ffn_gate.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.9.ffn_up.weight = #stream.parameter.named<"model"::"blk.9.ffn_up.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.9.ffn_down.weight = #stream.parameter.named<"model"::"blk.9.ffn_down.weight"> : tensor<3200x8640xf16>

  // blk.10
  util.global private @__auto.blk.10.attn_norm.weight = #stream.parameter.named<"model"::"blk.10.attn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.10.attn_q.weight = #stream.parameter.named<"model"::"blk.10.attn_q.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.10.attn_k.weight = #stream.parameter.named<"model"::"blk.10.attn_k.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.10.attn_v.weight = #stream.parameter.named<"model"::"blk.10.attn_v.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.10.attn_output.weight = #stream.parameter.named<"model"::"blk.10.attn_output.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.10.ffn_norm.weight = #stream.parameter.named<"model"::"blk.10.ffn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.10.ffn_gate.weight = #stream.parameter.named<"model"::"blk.10.ffn_gate.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.10.ffn_up.weight = #stream.parameter.named<"model"::"blk.10.ffn_up.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.10.ffn_down.weight = #stream.parameter.named<"model"::"blk.10.ffn_down.weight"> : tensor<3200x8640xf16>

  // blk.11
  util.global private @__auto.blk.11.attn_norm.weight = #stream.parameter.named<"model"::"blk.11.attn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.11.attn_q.weight = #stream.parameter.named<"model"::"blk.11.attn_q.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.11.attn_k.weight = #stream.parameter.named<"model"::"blk.11.attn_k.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.11.attn_v.weight = #stream.parameter.named<"model"::"blk.11.attn_v.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.11.attn_output.weight = #stream.parameter.named<"model"::"blk.11.attn_output.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.11.ffn_norm.weight = #stream.parameter.named<"model"::"blk.11.ffn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.11.ffn_gate.weight = #stream.parameter.named<"model"::"blk.11.ffn_gate.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.11.ffn_up.weight = #stream.parameter.named<"model"::"blk.11.ffn_up.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.11.ffn_down.weight = #stream.parameter.named<"model"::"blk.11.ffn_down.weight"> : tensor<3200x8640xf16>

  // blk.12
  util.global private @__auto.blk.12.attn_norm.weight = #stream.parameter.named<"model"::"blk.12.attn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.12.attn_q.weight = #stream.parameter.named<"model"::"blk.12.attn_q.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.12.attn_k.weight = #stream.parameter.named<"model"::"blk.12.attn_k.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.12.attn_v.weight = #stream.parameter.named<"model"::"blk.12.attn_v.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.12.attn_output.weight = #stream.parameter.named<"model"::"blk.12.attn_output.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.12.ffn_norm.weight = #stream.parameter.named<"model"::"blk.12.ffn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.12.ffn_gate.weight = #stream.parameter.named<"model"::"blk.12.ffn_gate.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.12.ffn_up.weight = #stream.parameter.named<"model"::"blk.12.ffn_up.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.12.ffn_down.weight = #stream.parameter.named<"model"::"blk.12.ffn_down.weight"> : tensor<3200x8640xf16>

  // blk.13
  util.global private @__auto.blk.13.attn_norm.weight = #stream.parameter.named<"model"::"blk.13.attn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.13.attn_q.weight = #stream.parameter.named<"model"::"blk.13.attn_q.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.13.attn_k.weight = #stream.parameter.named<"model"::"blk.13.attn_k.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.13.attn_v.weight = #stream.parameter.named<"model"::"blk.13.attn_v.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.13.attn_output.weight = #stream.parameter.named<"model"::"blk.13.attn_output.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.13.ffn_norm.weight = #stream.parameter.named<"model"::"blk.13.ffn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.13.ffn_gate.weight = #stream.parameter.named<"model"::"blk.13.ffn_gate.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.13.ffn_up.weight = #stream.parameter.named<"model"::"blk.13.ffn_up.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.13.ffn_down.weight = #stream.parameter.named<"model"::"blk.13.ffn_down.weight"> : tensor<3200x8640xf16>

  // blk.14
  util.global private @__auto.blk.14.attn_norm.weight = #stream.parameter.named<"model"::"blk.14.attn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.14.attn_q.weight = #stream.parameter.named<"model"::"blk.14.attn_q.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.14.attn_k.weight = #stream.parameter.named<"model"::"blk.14.attn_k.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.14.attn_v.weight = #stream.parameter.named<"model"::"blk.14.attn_v.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.14.attn_output.weight = #stream.parameter.named<"model"::"blk.14.attn_output.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.14.ffn_norm.weight = #stream.parameter.named<"model"::"blk.14.ffn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.14.ffn_gate.weight = #stream.parameter.named<"model"::"blk.14.ffn_gate.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.14.ffn_up.weight = #stream.parameter.named<"model"::"blk.14.ffn_up.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.14.ffn_down.weight = #stream.parameter.named<"model"::"blk.14.ffn_down.weight"> : tensor<3200x8640xf16>

  // blk.15
  util.global private @__auto.blk.15.attn_norm.weight = #stream.parameter.named<"model"::"blk.15.attn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.15.attn_q.weight = #stream.parameter.named<"model"::"blk.15.attn_q.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.15.attn_k.weight = #stream.parameter.named<"model"::"blk.15.attn_k.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.15.attn_v.weight = #stream.parameter.named<"model"::"blk.15.attn_v.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.15.attn_output.weight = #stream.parameter.named<"model"::"blk.15.attn_output.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.15.ffn_norm.weight = #stream.parameter.named<"model"::"blk.15.ffn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.15.ffn_gate.weight = #stream.parameter.named<"model"::"blk.15.ffn_gate.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.15.ffn_up.weight = #stream.parameter.named<"model"::"blk.15.ffn_up.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.15.ffn_down.weight = #stream.parameter.named<"model"::"blk.15.ffn_down.weight"> : tensor<3200x8640xf16>

  // blk.16
  util.global private @__auto.blk.16.attn_norm.weight = #stream.parameter.named<"model"::"blk.16.attn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.16.attn_q.weight = #stream.parameter.named<"model"::"blk.16.attn_q.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.16.attn_k.weight = #stream.parameter.named<"model"::"blk.16.attn_k.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.16.attn_v.weight = #stream.parameter.named<"model"::"blk.16.attn_v.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.16.attn_output.weight = #stream.parameter.named<"model"::"blk.16.attn_output.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.16.ffn_norm.weight = #stream.parameter.named<"model"::"blk.16.ffn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.16.ffn_gate.weight = #stream.parameter.named<"model"::"blk.16.ffn_gate.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.16.ffn_up.weight = #stream.parameter.named<"model"::"blk.16.ffn_up.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.16.ffn_down.weight = #stream.parameter.named<"model"::"blk.16.ffn_down.weight"> : tensor<3200x8640xf16>

  // blk.17
  util.global private @__auto.blk.17.attn_norm.weight = #stream.parameter.named<"model"::"blk.17.attn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.17.attn_q.weight = #stream.parameter.named<"model"::"blk.17.attn_q.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.17.attn_k.weight = #stream.parameter.named<"model"::"blk.17.attn_k.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.17.attn_v.weight = #stream.parameter.named<"model"::"blk.17.attn_v.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.17.attn_output.weight = #stream.parameter.named<"model"::"blk.17.attn_output.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.17.ffn_norm.weight = #stream.parameter.named<"model"::"blk.17.ffn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.17.ffn_gate.weight = #stream.parameter.named<"model"::"blk.17.ffn_gate.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.17.ffn_up.weight = #stream.parameter.named<"model"::"blk.17.ffn_up.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.17.ffn_down.weight = #stream.parameter.named<"model"::"blk.17.ffn_down.weight"> : tensor<3200x8640xf16>

  // blk.18
  util.global private @__auto.blk.18.attn_norm.weight = #stream.parameter.named<"model"::"blk.18.attn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.18.attn_q.weight = #stream.parameter.named<"model"::"blk.18.attn_q.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.18.attn_k.weight = #stream.parameter.named<"model"::"blk.18.attn_k.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.18.attn_v.weight = #stream.parameter.named<"model"::"blk.18.attn_v.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.18.attn_output.weight = #stream.parameter.named<"model"::"blk.18.attn_output.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.18.ffn_norm.weight = #stream.parameter.named<"model"::"blk.18.ffn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.18.ffn_gate.weight = #stream.parameter.named<"model"::"blk.18.ffn_gate.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.18.ffn_up.weight = #stream.parameter.named<"model"::"blk.18.ffn_up.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.18.ffn_down.weight = #stream.parameter.named<"model"::"blk.18.ffn_down.weight"> : tensor<3200x8640xf16>

  // blk.19
  util.global private @__auto.blk.19.attn_norm.weight = #stream.parameter.named<"model"::"blk.19.attn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.19.attn_q.weight = #stream.parameter.named<"model"::"blk.19.attn_q.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.19.attn_k.weight = #stream.parameter.named<"model"::"blk.19.attn_k.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.19.attn_v.weight = #stream.parameter.named<"model"::"blk.19.attn_v.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.19.attn_output.weight = #stream.parameter.named<"model"::"blk.19.attn_output.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.19.ffn_norm.weight = #stream.parameter.named<"model"::"blk.19.ffn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.19.ffn_gate.weight = #stream.parameter.named<"model"::"blk.19.ffn_gate.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.19.ffn_up.weight = #stream.parameter.named<"model"::"blk.19.ffn_up.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.19.ffn_down.weight = #stream.parameter.named<"model"::"blk.19.ffn_down.weight"> : tensor<3200x8640xf16>

  // blk.20
  util.global private @__auto.blk.20.attn_norm.weight = #stream.parameter.named<"model"::"blk.20.attn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.20.attn_q.weight = #stream.parameter.named<"model"::"blk.20.attn_q.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.20.attn_k.weight = #stream.parameter.named<"model"::"blk.20.attn_k.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.20.attn_v.weight = #stream.parameter.named<"model"::"blk.20.attn_v.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.20.attn_output.weight = #stream.parameter.named<"model"::"blk.20.attn_output.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.20.ffn_norm.weight = #stream.parameter.named<"model"::"blk.20.ffn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.20.ffn_gate.weight = #stream.parameter.named<"model"::"blk.20.ffn_gate.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.20.ffn_up.weight = #stream.parameter.named<"model"::"blk.20.ffn_up.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.20.ffn_down.weight = #stream.parameter.named<"model"::"blk.20.ffn_down.weight"> : tensor<3200x8640xf16>

  // blk.21
  util.global private @__auto.blk.21.attn_norm.weight = #stream.parameter.named<"model"::"blk.21.attn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.21.attn_q.weight = #stream.parameter.named<"model"::"blk.21.attn_q.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.21.attn_k.weight = #stream.parameter.named<"model"::"blk.21.attn_k.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.21.attn_v.weight = #stream.parameter.named<"model"::"blk.21.attn_v.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.21.attn_output.weight = #stream.parameter.named<"model"::"blk.21.attn_output.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.21.ffn_norm.weight = #stream.parameter.named<"model"::"blk.21.ffn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.21.ffn_gate.weight = #stream.parameter.named<"model"::"blk.21.ffn_gate.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.21.ffn_up.weight = #stream.parameter.named<"model"::"blk.21.ffn_up.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.21.ffn_down.weight = #stream.parameter.named<"model"::"blk.21.ffn_down.weight"> : tensor<3200x8640xf16>

  // blk.22
  util.global private @__auto.blk.22.attn_norm.weight = #stream.parameter.named<"model"::"blk.22.attn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.22.attn_q.weight = #stream.parameter.named<"model"::"blk.22.attn_q.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.22.attn_k.weight = #stream.parameter.named<"model"::"blk.22.attn_k.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.22.attn_v.weight = #stream.parameter.named<"model"::"blk.22.attn_v.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.22.attn_output.weight = #stream.parameter.named<"model"::"blk.22.attn_output.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.22.ffn_norm.weight = #stream.parameter.named<"model"::"blk.22.ffn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.22.ffn_gate.weight = #stream.parameter.named<"model"::"blk.22.ffn_gate.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.22.ffn_up.weight = #stream.parameter.named<"model"::"blk.22.ffn_up.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.22.ffn_down.weight = #stream.parameter.named<"model"::"blk.22.ffn_down.weight"> : tensor<3200x8640xf16>

  // blk.23
  util.global private @__auto.blk.23.attn_norm.weight = #stream.parameter.named<"model"::"blk.23.attn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.23.attn_q.weight = #stream.parameter.named<"model"::"blk.23.attn_q.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.23.attn_k.weight = #stream.parameter.named<"model"::"blk.23.attn_k.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.23.attn_v.weight = #stream.parameter.named<"model"::"blk.23.attn_v.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.23.attn_output.weight = #stream.parameter.named<"model"::"blk.23.attn_output.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.23.ffn_norm.weight = #stream.parameter.named<"model"::"blk.23.ffn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.23.ffn_gate.weight = #stream.parameter.named<"model"::"blk.23.ffn_gate.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.23.ffn_up.weight = #stream.parameter.named<"model"::"blk.23.ffn_up.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.23.ffn_down.weight = #stream.parameter.named<"model"::"blk.23.ffn_down.weight"> : tensor<3200x8640xf16>

  // blk.24
  util.global private @__auto.blk.24.attn_norm.weight = #stream.parameter.named<"model"::"blk.24.attn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.24.attn_q.weight = #stream.parameter.named<"model"::"blk.24.attn_q.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.24.attn_k.weight = #stream.parameter.named<"model"::"blk.24.attn_k.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.24.attn_v.weight = #stream.parameter.named<"model"::"blk.24.attn_v.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.24.attn_output.weight = #stream.parameter.named<"model"::"blk.24.attn_output.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.24.ffn_norm.weight = #stream.parameter.named<"model"::"blk.24.ffn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.24.ffn_gate.weight = #stream.parameter.named<"model"::"blk.24.ffn_gate.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.24.ffn_up.weight = #stream.parameter.named<"model"::"blk.24.ffn_up.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.24.ffn_down.weight = #stream.parameter.named<"model"::"blk.24.ffn_down.weight"> : tensor<3200x8640xf16>

  // blk.25
  util.global private @__auto.blk.25.attn_norm.weight = #stream.parameter.named<"model"::"blk.25.attn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.25.attn_q.weight = #stream.parameter.named<"model"::"blk.25.attn_q.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.25.attn_k.weight = #stream.parameter.named<"model"::"blk.25.attn_k.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.25.attn_v.weight = #stream.parameter.named<"model"::"blk.25.attn_v.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.25.attn_output.weight = #stream.parameter.named<"model"::"blk.25.attn_output.weight"> : tensor<3200x3200xf16>
  util.global private @__auto.blk.25.ffn_norm.weight = #stream.parameter.named<"model"::"blk.25.ffn_norm.weight"> : tensor<3200xf32>
  util.global private @__auto.blk.25.ffn_gate.weight = #stream.parameter.named<"model"::"blk.25.ffn_gate.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.25.ffn_up.weight = #stream.parameter.named<"model"::"blk.25.ffn_up.weight"> : tensor<8640x3200xf16>
  util.global private @__auto.blk.25.ffn_down.weight = #stream.parameter.named<"model"::"blk.25.ffn_down.weight"> : tensor<3200x8640xf16>

  // Parameter declared after the last per-block group.
  util.global private @__auto.output_norm.weight = #stream.parameter.named<"model"::"output_norm.weight"> : tensor<3200xf32>
util.global private @__auto.output.weight = #stream.parameter.named<"model"::"output.weight"> : tensor<32000x3200xf16> func.func @decode_bs4(%arg0: !torch.vtensor<[4,1],si64>, %arg1: !torch.vtensor<[4],si64>, %arg2: !torch.vtensor<[4],si64>, %arg3: !torch.vtensor<[4,?],si64>, %arg4: !torch.tensor<[?,2662400],f32>) -> !torch.vtensor<[4,1,32000],f32> { %__auto.constant_2048_50_torch.complex64 = util.global.load @__auto.constant_2048_50_torch.complex64 : tensor<2048x50xcomplex> %0 = torch_c.from_builtin_tensor %__auto.constant_2048_50_torch.complex64 : tensor<2048x50xcomplex> -> !torch.vtensor<[2048,50],complex> %__auto.token_embd.weight = util.global.load @__auto.token_embd.weight : tensor<32000x3200xf16> %1 = torch_c.from_builtin_tensor %__auto.token_embd.weight : tensor<32000x3200xf16> -> !torch.vtensor<[32000,3200],f16> %__auto.blk.0.attn_norm.weight = util.global.load @__auto.blk.0.attn_norm.weight : tensor<3200xf32> %2 = torch_c.from_builtin_tensor %__auto.blk.0.attn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.0.attn_q.weight = util.global.load @__auto.blk.0.attn_q.weight : tensor<3200x3200xf16> %3 = torch_c.from_builtin_tensor %__auto.blk.0.attn_q.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.0.attn_k.weight = util.global.load @__auto.blk.0.attn_k.weight : tensor<3200x3200xf16> %4 = torch_c.from_builtin_tensor %__auto.blk.0.attn_k.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.0.attn_v.weight = util.global.load @__auto.blk.0.attn_v.weight : tensor<3200x3200xf16> %5 = torch_c.from_builtin_tensor %__auto.blk.0.attn_v.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.0.attn_output.weight = util.global.load @__auto.blk.0.attn_output.weight : tensor<3200x3200xf16> %6 = torch_c.from_builtin_tensor %__auto.blk.0.attn_output.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.0.ffn_norm.weight = util.global.load 
@__auto.blk.0.ffn_norm.weight : tensor<3200xf32> %7 = torch_c.from_builtin_tensor %__auto.blk.0.ffn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.0.ffn_gate.weight = util.global.load @__auto.blk.0.ffn_gate.weight : tensor<8640x3200xf16> %8 = torch_c.from_builtin_tensor %__auto.blk.0.ffn_gate.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.0.ffn_up.weight = util.global.load @__auto.blk.0.ffn_up.weight : tensor<8640x3200xf16> %9 = torch_c.from_builtin_tensor %__auto.blk.0.ffn_up.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.0.ffn_down.weight = util.global.load @__auto.blk.0.ffn_down.weight : tensor<3200x8640xf16> %10 = torch_c.from_builtin_tensor %__auto.blk.0.ffn_down.weight : tensor<3200x8640xf16> -> !torch.vtensor<[3200,8640],f16> %__auto.blk.1.attn_norm.weight = util.global.load @__auto.blk.1.attn_norm.weight : tensor<3200xf32> %11 = torch_c.from_builtin_tensor %__auto.blk.1.attn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.1.attn_q.weight = util.global.load @__auto.blk.1.attn_q.weight : tensor<3200x3200xf16> %12 = torch_c.from_builtin_tensor %__auto.blk.1.attn_q.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.1.attn_k.weight = util.global.load @__auto.blk.1.attn_k.weight : tensor<3200x3200xf16> %13 = torch_c.from_builtin_tensor %__auto.blk.1.attn_k.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.1.attn_v.weight = util.global.load @__auto.blk.1.attn_v.weight : tensor<3200x3200xf16> %14 = torch_c.from_builtin_tensor %__auto.blk.1.attn_v.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.1.attn_output.weight = util.global.load @__auto.blk.1.attn_output.weight : tensor<3200x3200xf16> %15 = torch_c.from_builtin_tensor %__auto.blk.1.attn_output.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.1.ffn_norm.weight = util.global.load 
@__auto.blk.1.ffn_norm.weight : tensor<3200xf32> %16 = torch_c.from_builtin_tensor %__auto.blk.1.ffn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.1.ffn_gate.weight = util.global.load @__auto.blk.1.ffn_gate.weight : tensor<8640x3200xf16> %17 = torch_c.from_builtin_tensor %__auto.blk.1.ffn_gate.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.1.ffn_up.weight = util.global.load @__auto.blk.1.ffn_up.weight : tensor<8640x3200xf16> %18 = torch_c.from_builtin_tensor %__auto.blk.1.ffn_up.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.1.ffn_down.weight = util.global.load @__auto.blk.1.ffn_down.weight : tensor<3200x8640xf16> %19 = torch_c.from_builtin_tensor %__auto.blk.1.ffn_down.weight : tensor<3200x8640xf16> -> !torch.vtensor<[3200,8640],f16> %__auto.blk.2.attn_norm.weight = util.global.load @__auto.blk.2.attn_norm.weight : tensor<3200xf32> %20 = torch_c.from_builtin_tensor %__auto.blk.2.attn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.2.attn_q.weight = util.global.load @__auto.blk.2.attn_q.weight : tensor<3200x3200xf16> %21 = torch_c.from_builtin_tensor %__auto.blk.2.attn_q.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.2.attn_k.weight = util.global.load @__auto.blk.2.attn_k.weight : tensor<3200x3200xf16> %22 = torch_c.from_builtin_tensor %__auto.blk.2.attn_k.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.2.attn_v.weight = util.global.load @__auto.blk.2.attn_v.weight : tensor<3200x3200xf16> %23 = torch_c.from_builtin_tensor %__auto.blk.2.attn_v.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.2.attn_output.weight = util.global.load @__auto.blk.2.attn_output.weight : tensor<3200x3200xf16> %24 = torch_c.from_builtin_tensor %__auto.blk.2.attn_output.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.2.ffn_norm.weight = util.global.load 
@__auto.blk.2.ffn_norm.weight : tensor<3200xf32> %25 = torch_c.from_builtin_tensor %__auto.blk.2.ffn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.2.ffn_gate.weight = util.global.load @__auto.blk.2.ffn_gate.weight : tensor<8640x3200xf16> %26 = torch_c.from_builtin_tensor %__auto.blk.2.ffn_gate.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.2.ffn_up.weight = util.global.load @__auto.blk.2.ffn_up.weight : tensor<8640x3200xf16> %27 = torch_c.from_builtin_tensor %__auto.blk.2.ffn_up.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.2.ffn_down.weight = util.global.load @__auto.blk.2.ffn_down.weight : tensor<3200x8640xf16> %28 = torch_c.from_builtin_tensor %__auto.blk.2.ffn_down.weight : tensor<3200x8640xf16> -> !torch.vtensor<[3200,8640],f16> %__auto.blk.3.attn_norm.weight = util.global.load @__auto.blk.3.attn_norm.weight : tensor<3200xf32> %29 = torch_c.from_builtin_tensor %__auto.blk.3.attn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.3.attn_q.weight = util.global.load @__auto.blk.3.attn_q.weight : tensor<3200x3200xf16> %30 = torch_c.from_builtin_tensor %__auto.blk.3.attn_q.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.3.attn_k.weight = util.global.load @__auto.blk.3.attn_k.weight : tensor<3200x3200xf16> %31 = torch_c.from_builtin_tensor %__auto.blk.3.attn_k.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.3.attn_v.weight = util.global.load @__auto.blk.3.attn_v.weight : tensor<3200x3200xf16> %32 = torch_c.from_builtin_tensor %__auto.blk.3.attn_v.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.3.attn_output.weight = util.global.load @__auto.blk.3.attn_output.weight : tensor<3200x3200xf16> %33 = torch_c.from_builtin_tensor %__auto.blk.3.attn_output.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.3.ffn_norm.weight = util.global.load 
@__auto.blk.3.ffn_norm.weight : tensor<3200xf32> %34 = torch_c.from_builtin_tensor %__auto.blk.3.ffn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.3.ffn_gate.weight = util.global.load @__auto.blk.3.ffn_gate.weight : tensor<8640x3200xf16> %35 = torch_c.from_builtin_tensor %__auto.blk.3.ffn_gate.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.3.ffn_up.weight = util.global.load @__auto.blk.3.ffn_up.weight : tensor<8640x3200xf16> %36 = torch_c.from_builtin_tensor %__auto.blk.3.ffn_up.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.3.ffn_down.weight = util.global.load @__auto.blk.3.ffn_down.weight : tensor<3200x8640xf16> %37 = torch_c.from_builtin_tensor %__auto.blk.3.ffn_down.weight : tensor<3200x8640xf16> -> !torch.vtensor<[3200,8640],f16> %__auto.blk.4.attn_norm.weight = util.global.load @__auto.blk.4.attn_norm.weight : tensor<3200xf32> %38 = torch_c.from_builtin_tensor %__auto.blk.4.attn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.4.attn_q.weight = util.global.load @__auto.blk.4.attn_q.weight : tensor<3200x3200xf16> %39 = torch_c.from_builtin_tensor %__auto.blk.4.attn_q.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.4.attn_k.weight = util.global.load @__auto.blk.4.attn_k.weight : tensor<3200x3200xf16> %40 = torch_c.from_builtin_tensor %__auto.blk.4.attn_k.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.4.attn_v.weight = util.global.load @__auto.blk.4.attn_v.weight : tensor<3200x3200xf16> %41 = torch_c.from_builtin_tensor %__auto.blk.4.attn_v.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.4.attn_output.weight = util.global.load @__auto.blk.4.attn_output.weight : tensor<3200x3200xf16> %42 = torch_c.from_builtin_tensor %__auto.blk.4.attn_output.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.4.ffn_norm.weight = util.global.load 
@__auto.blk.4.ffn_norm.weight : tensor<3200xf32> %43 = torch_c.from_builtin_tensor %__auto.blk.4.ffn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.4.ffn_gate.weight = util.global.load @__auto.blk.4.ffn_gate.weight : tensor<8640x3200xf16> %44 = torch_c.from_builtin_tensor %__auto.blk.4.ffn_gate.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.4.ffn_up.weight = util.global.load @__auto.blk.4.ffn_up.weight : tensor<8640x3200xf16> %45 = torch_c.from_builtin_tensor %__auto.blk.4.ffn_up.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.4.ffn_down.weight = util.global.load @__auto.blk.4.ffn_down.weight : tensor<3200x8640xf16> %46 = torch_c.from_builtin_tensor %__auto.blk.4.ffn_down.weight : tensor<3200x8640xf16> -> !torch.vtensor<[3200,8640],f16> %__auto.blk.5.attn_norm.weight = util.global.load @__auto.blk.5.attn_norm.weight : tensor<3200xf32> %47 = torch_c.from_builtin_tensor %__auto.blk.5.attn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.5.attn_q.weight = util.global.load @__auto.blk.5.attn_q.weight : tensor<3200x3200xf16> %48 = torch_c.from_builtin_tensor %__auto.blk.5.attn_q.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.5.attn_k.weight = util.global.load @__auto.blk.5.attn_k.weight : tensor<3200x3200xf16> %49 = torch_c.from_builtin_tensor %__auto.blk.5.attn_k.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.5.attn_v.weight = util.global.load @__auto.blk.5.attn_v.weight : tensor<3200x3200xf16> %50 = torch_c.from_builtin_tensor %__auto.blk.5.attn_v.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.5.attn_output.weight = util.global.load @__auto.blk.5.attn_output.weight : tensor<3200x3200xf16> %51 = torch_c.from_builtin_tensor %__auto.blk.5.attn_output.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.5.ffn_norm.weight = util.global.load 
@__auto.blk.5.ffn_norm.weight : tensor<3200xf32> %52 = torch_c.from_builtin_tensor %__auto.blk.5.ffn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.5.ffn_gate.weight = util.global.load @__auto.blk.5.ffn_gate.weight : tensor<8640x3200xf16> %53 = torch_c.from_builtin_tensor %__auto.blk.5.ffn_gate.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.5.ffn_up.weight = util.global.load @__auto.blk.5.ffn_up.weight : tensor<8640x3200xf16> %54 = torch_c.from_builtin_tensor %__auto.blk.5.ffn_up.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.5.ffn_down.weight = util.global.load @__auto.blk.5.ffn_down.weight : tensor<3200x8640xf16> %55 = torch_c.from_builtin_tensor %__auto.blk.5.ffn_down.weight : tensor<3200x8640xf16> -> !torch.vtensor<[3200,8640],f16> %__auto.blk.6.attn_norm.weight = util.global.load @__auto.blk.6.attn_norm.weight : tensor<3200xf32> %56 = torch_c.from_builtin_tensor %__auto.blk.6.attn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.6.attn_q.weight = util.global.load @__auto.blk.6.attn_q.weight : tensor<3200x3200xf16> %57 = torch_c.from_builtin_tensor %__auto.blk.6.attn_q.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.6.attn_k.weight = util.global.load @__auto.blk.6.attn_k.weight : tensor<3200x3200xf16> %58 = torch_c.from_builtin_tensor %__auto.blk.6.attn_k.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.6.attn_v.weight = util.global.load @__auto.blk.6.attn_v.weight : tensor<3200x3200xf16> %59 = torch_c.from_builtin_tensor %__auto.blk.6.attn_v.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.6.attn_output.weight = util.global.load @__auto.blk.6.attn_output.weight : tensor<3200x3200xf16> %60 = torch_c.from_builtin_tensor %__auto.blk.6.attn_output.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.6.ffn_norm.weight = util.global.load 
@__auto.blk.6.ffn_norm.weight : tensor<3200xf32> %61 = torch_c.from_builtin_tensor %__auto.blk.6.ffn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.6.ffn_gate.weight = util.global.load @__auto.blk.6.ffn_gate.weight : tensor<8640x3200xf16> %62 = torch_c.from_builtin_tensor %__auto.blk.6.ffn_gate.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.6.ffn_up.weight = util.global.load @__auto.blk.6.ffn_up.weight : tensor<8640x3200xf16> %63 = torch_c.from_builtin_tensor %__auto.blk.6.ffn_up.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.6.ffn_down.weight = util.global.load @__auto.blk.6.ffn_down.weight : tensor<3200x8640xf16> %64 = torch_c.from_builtin_tensor %__auto.blk.6.ffn_down.weight : tensor<3200x8640xf16> -> !torch.vtensor<[3200,8640],f16> %__auto.blk.7.attn_norm.weight = util.global.load @__auto.blk.7.attn_norm.weight : tensor<3200xf32> %65 = torch_c.from_builtin_tensor %__auto.blk.7.attn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.7.attn_q.weight = util.global.load @__auto.blk.7.attn_q.weight : tensor<3200x3200xf16> %66 = torch_c.from_builtin_tensor %__auto.blk.7.attn_q.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.7.attn_k.weight = util.global.load @__auto.blk.7.attn_k.weight : tensor<3200x3200xf16> %67 = torch_c.from_builtin_tensor %__auto.blk.7.attn_k.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.7.attn_v.weight = util.global.load @__auto.blk.7.attn_v.weight : tensor<3200x3200xf16> %68 = torch_c.from_builtin_tensor %__auto.blk.7.attn_v.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.7.attn_output.weight = util.global.load @__auto.blk.7.attn_output.weight : tensor<3200x3200xf16> %69 = torch_c.from_builtin_tensor %__auto.blk.7.attn_output.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.7.ffn_norm.weight = util.global.load 
@__auto.blk.7.ffn_norm.weight : tensor<3200xf32> %70 = torch_c.from_builtin_tensor %__auto.blk.7.ffn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.7.ffn_gate.weight = util.global.load @__auto.blk.7.ffn_gate.weight : tensor<8640x3200xf16> %71 = torch_c.from_builtin_tensor %__auto.blk.7.ffn_gate.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.7.ffn_up.weight = util.global.load @__auto.blk.7.ffn_up.weight : tensor<8640x3200xf16> %72 = torch_c.from_builtin_tensor %__auto.blk.7.ffn_up.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.7.ffn_down.weight = util.global.load @__auto.blk.7.ffn_down.weight : tensor<3200x8640xf16> %73 = torch_c.from_builtin_tensor %__auto.blk.7.ffn_down.weight : tensor<3200x8640xf16> -> !torch.vtensor<[3200,8640],f16> %__auto.blk.8.attn_norm.weight = util.global.load @__auto.blk.8.attn_norm.weight : tensor<3200xf32> %74 = torch_c.from_builtin_tensor %__auto.blk.8.attn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.8.attn_q.weight = util.global.load @__auto.blk.8.attn_q.weight : tensor<3200x3200xf16> %75 = torch_c.from_builtin_tensor %__auto.blk.8.attn_q.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.8.attn_k.weight = util.global.load @__auto.blk.8.attn_k.weight : tensor<3200x3200xf16> %76 = torch_c.from_builtin_tensor %__auto.blk.8.attn_k.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.8.attn_v.weight = util.global.load @__auto.blk.8.attn_v.weight : tensor<3200x3200xf16> %77 = torch_c.from_builtin_tensor %__auto.blk.8.attn_v.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.8.attn_output.weight = util.global.load @__auto.blk.8.attn_output.weight : tensor<3200x3200xf16> %78 = torch_c.from_builtin_tensor %__auto.blk.8.attn_output.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.8.ffn_norm.weight = util.global.load 
@__auto.blk.8.ffn_norm.weight : tensor<3200xf32> %79 = torch_c.from_builtin_tensor %__auto.blk.8.ffn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.8.ffn_gate.weight = util.global.load @__auto.blk.8.ffn_gate.weight : tensor<8640x3200xf16> %80 = torch_c.from_builtin_tensor %__auto.blk.8.ffn_gate.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.8.ffn_up.weight = util.global.load @__auto.blk.8.ffn_up.weight : tensor<8640x3200xf16> %81 = torch_c.from_builtin_tensor %__auto.blk.8.ffn_up.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.8.ffn_down.weight = util.global.load @__auto.blk.8.ffn_down.weight : tensor<3200x8640xf16> %82 = torch_c.from_builtin_tensor %__auto.blk.8.ffn_down.weight : tensor<3200x8640xf16> -> !torch.vtensor<[3200,8640],f16> %__auto.blk.9.attn_norm.weight = util.global.load @__auto.blk.9.attn_norm.weight : tensor<3200xf32> %83 = torch_c.from_builtin_tensor %__auto.blk.9.attn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.9.attn_q.weight = util.global.load @__auto.blk.9.attn_q.weight : tensor<3200x3200xf16> %84 = torch_c.from_builtin_tensor %__auto.blk.9.attn_q.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.9.attn_k.weight = util.global.load @__auto.blk.9.attn_k.weight : tensor<3200x3200xf16> %85 = torch_c.from_builtin_tensor %__auto.blk.9.attn_k.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.9.attn_v.weight = util.global.load @__auto.blk.9.attn_v.weight : tensor<3200x3200xf16> %86 = torch_c.from_builtin_tensor %__auto.blk.9.attn_v.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.9.attn_output.weight = util.global.load @__auto.blk.9.attn_output.weight : tensor<3200x3200xf16> %87 = torch_c.from_builtin_tensor %__auto.blk.9.attn_output.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.9.ffn_norm.weight = util.global.load 
@__auto.blk.9.ffn_norm.weight : tensor<3200xf32> %88 = torch_c.from_builtin_tensor %__auto.blk.9.ffn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.9.ffn_gate.weight = util.global.load @__auto.blk.9.ffn_gate.weight : tensor<8640x3200xf16> %89 = torch_c.from_builtin_tensor %__auto.blk.9.ffn_gate.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.9.ffn_up.weight = util.global.load @__auto.blk.9.ffn_up.weight : tensor<8640x3200xf16> %90 = torch_c.from_builtin_tensor %__auto.blk.9.ffn_up.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.9.ffn_down.weight = util.global.load @__auto.blk.9.ffn_down.weight : tensor<3200x8640xf16> %91 = torch_c.from_builtin_tensor %__auto.blk.9.ffn_down.weight : tensor<3200x8640xf16> -> !torch.vtensor<[3200,8640],f16> %__auto.blk.10.attn_norm.weight = util.global.load @__auto.blk.10.attn_norm.weight : tensor<3200xf32> %92 = torch_c.from_builtin_tensor %__auto.blk.10.attn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.10.attn_q.weight = util.global.load @__auto.blk.10.attn_q.weight : tensor<3200x3200xf16> %93 = torch_c.from_builtin_tensor %__auto.blk.10.attn_q.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.10.attn_k.weight = util.global.load @__auto.blk.10.attn_k.weight : tensor<3200x3200xf16> %94 = torch_c.from_builtin_tensor %__auto.blk.10.attn_k.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.10.attn_v.weight = util.global.load @__auto.blk.10.attn_v.weight : tensor<3200x3200xf16> %95 = torch_c.from_builtin_tensor %__auto.blk.10.attn_v.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.10.attn_output.weight = util.global.load @__auto.blk.10.attn_output.weight : tensor<3200x3200xf16> %96 = torch_c.from_builtin_tensor %__auto.blk.10.attn_output.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.10.ffn_norm.weight = 
util.global.load @__auto.blk.10.ffn_norm.weight : tensor<3200xf32> %97 = torch_c.from_builtin_tensor %__auto.blk.10.ffn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.10.ffn_gate.weight = util.global.load @__auto.blk.10.ffn_gate.weight : tensor<8640x3200xf16> %98 = torch_c.from_builtin_tensor %__auto.blk.10.ffn_gate.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.10.ffn_up.weight = util.global.load @__auto.blk.10.ffn_up.weight : tensor<8640x3200xf16> %99 = torch_c.from_builtin_tensor %__auto.blk.10.ffn_up.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.10.ffn_down.weight = util.global.load @__auto.blk.10.ffn_down.weight : tensor<3200x8640xf16> %100 = torch_c.from_builtin_tensor %__auto.blk.10.ffn_down.weight : tensor<3200x8640xf16> -> !torch.vtensor<[3200,8640],f16> %__auto.blk.11.attn_norm.weight = util.global.load @__auto.blk.11.attn_norm.weight : tensor<3200xf32> %101 = torch_c.from_builtin_tensor %__auto.blk.11.attn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.11.attn_q.weight = util.global.load @__auto.blk.11.attn_q.weight : tensor<3200x3200xf16> %102 = torch_c.from_builtin_tensor %__auto.blk.11.attn_q.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.11.attn_k.weight = util.global.load @__auto.blk.11.attn_k.weight : tensor<3200x3200xf16> %103 = torch_c.from_builtin_tensor %__auto.blk.11.attn_k.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.11.attn_v.weight = util.global.load @__auto.blk.11.attn_v.weight : tensor<3200x3200xf16> %104 = torch_c.from_builtin_tensor %__auto.blk.11.attn_v.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.11.attn_output.weight = util.global.load @__auto.blk.11.attn_output.weight : tensor<3200x3200xf16> %105 = torch_c.from_builtin_tensor %__auto.blk.11.attn_output.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> 
%__auto.blk.11.ffn_norm.weight = util.global.load @__auto.blk.11.ffn_norm.weight : tensor<3200xf32> %106 = torch_c.from_builtin_tensor %__auto.blk.11.ffn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.11.ffn_gate.weight = util.global.load @__auto.blk.11.ffn_gate.weight : tensor<8640x3200xf16> %107 = torch_c.from_builtin_tensor %__auto.blk.11.ffn_gate.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.11.ffn_up.weight = util.global.load @__auto.blk.11.ffn_up.weight : tensor<8640x3200xf16> %108 = torch_c.from_builtin_tensor %__auto.blk.11.ffn_up.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.11.ffn_down.weight = util.global.load @__auto.blk.11.ffn_down.weight : tensor<3200x8640xf16> %109 = torch_c.from_builtin_tensor %__auto.blk.11.ffn_down.weight : tensor<3200x8640xf16> -> !torch.vtensor<[3200,8640],f16> %__auto.blk.12.attn_norm.weight = util.global.load @__auto.blk.12.attn_norm.weight : tensor<3200xf32> %110 = torch_c.from_builtin_tensor %__auto.blk.12.attn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.12.attn_q.weight = util.global.load @__auto.blk.12.attn_q.weight : tensor<3200x3200xf16> %111 = torch_c.from_builtin_tensor %__auto.blk.12.attn_q.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.12.attn_k.weight = util.global.load @__auto.blk.12.attn_k.weight : tensor<3200x3200xf16> %112 = torch_c.from_builtin_tensor %__auto.blk.12.attn_k.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.12.attn_v.weight = util.global.load @__auto.blk.12.attn_v.weight : tensor<3200x3200xf16> %113 = torch_c.from_builtin_tensor %__auto.blk.12.attn_v.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.12.attn_output.weight = util.global.load @__auto.blk.12.attn_output.weight : tensor<3200x3200xf16> %114 = torch_c.from_builtin_tensor %__auto.blk.12.attn_output.weight : tensor<3200x3200xf16> -> 
!torch.vtensor<[3200,3200],f16> %__auto.blk.12.ffn_norm.weight = util.global.load @__auto.blk.12.ffn_norm.weight : tensor<3200xf32> %115 = torch_c.from_builtin_tensor %__auto.blk.12.ffn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.12.ffn_gate.weight = util.global.load @__auto.blk.12.ffn_gate.weight : tensor<8640x3200xf16> %116 = torch_c.from_builtin_tensor %__auto.blk.12.ffn_gate.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.12.ffn_up.weight = util.global.load @__auto.blk.12.ffn_up.weight : tensor<8640x3200xf16> %117 = torch_c.from_builtin_tensor %__auto.blk.12.ffn_up.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.12.ffn_down.weight = util.global.load @__auto.blk.12.ffn_down.weight : tensor<3200x8640xf16> %118 = torch_c.from_builtin_tensor %__auto.blk.12.ffn_down.weight : tensor<3200x8640xf16> -> !torch.vtensor<[3200,8640],f16> %__auto.blk.13.attn_norm.weight = util.global.load @__auto.blk.13.attn_norm.weight : tensor<3200xf32> %119 = torch_c.from_builtin_tensor %__auto.blk.13.attn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.13.attn_q.weight = util.global.load @__auto.blk.13.attn_q.weight : tensor<3200x3200xf16> %120 = torch_c.from_builtin_tensor %__auto.blk.13.attn_q.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.13.attn_k.weight = util.global.load @__auto.blk.13.attn_k.weight : tensor<3200x3200xf16> %121 = torch_c.from_builtin_tensor %__auto.blk.13.attn_k.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.13.attn_v.weight = util.global.load @__auto.blk.13.attn_v.weight : tensor<3200x3200xf16> %122 = torch_c.from_builtin_tensor %__auto.blk.13.attn_v.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.13.attn_output.weight = util.global.load @__auto.blk.13.attn_output.weight : tensor<3200x3200xf16> %123 = torch_c.from_builtin_tensor 
%__auto.blk.13.attn_output.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.13.ffn_norm.weight = util.global.load @__auto.blk.13.ffn_norm.weight : tensor<3200xf32> %124 = torch_c.from_builtin_tensor %__auto.blk.13.ffn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.13.ffn_gate.weight = util.global.load @__auto.blk.13.ffn_gate.weight : tensor<8640x3200xf16> %125 = torch_c.from_builtin_tensor %__auto.blk.13.ffn_gate.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.13.ffn_up.weight = util.global.load @__auto.blk.13.ffn_up.weight : tensor<8640x3200xf16> %126 = torch_c.from_builtin_tensor %__auto.blk.13.ffn_up.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.13.ffn_down.weight = util.global.load @__auto.blk.13.ffn_down.weight : tensor<3200x8640xf16> %127 = torch_c.from_builtin_tensor %__auto.blk.13.ffn_down.weight : tensor<3200x8640xf16> -> !torch.vtensor<[3200,8640],f16> %__auto.blk.14.attn_norm.weight = util.global.load @__auto.blk.14.attn_norm.weight : tensor<3200xf32> %128 = torch_c.from_builtin_tensor %__auto.blk.14.attn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.14.attn_q.weight = util.global.load @__auto.blk.14.attn_q.weight : tensor<3200x3200xf16> %129 = torch_c.from_builtin_tensor %__auto.blk.14.attn_q.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.14.attn_k.weight = util.global.load @__auto.blk.14.attn_k.weight : tensor<3200x3200xf16> %130 = torch_c.from_builtin_tensor %__auto.blk.14.attn_k.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.14.attn_v.weight = util.global.load @__auto.blk.14.attn_v.weight : tensor<3200x3200xf16> %131 = torch_c.from_builtin_tensor %__auto.blk.14.attn_v.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.14.attn_output.weight = util.global.load @__auto.blk.14.attn_output.weight : tensor<3200x3200xf16> %132 = 
torch_c.from_builtin_tensor %__auto.blk.14.attn_output.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.14.ffn_norm.weight = util.global.load @__auto.blk.14.ffn_norm.weight : tensor<3200xf32> %133 = torch_c.from_builtin_tensor %__auto.blk.14.ffn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.14.ffn_gate.weight = util.global.load @__auto.blk.14.ffn_gate.weight : tensor<8640x3200xf16> %134 = torch_c.from_builtin_tensor %__auto.blk.14.ffn_gate.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.14.ffn_up.weight = util.global.load @__auto.blk.14.ffn_up.weight : tensor<8640x3200xf16> %135 = torch_c.from_builtin_tensor %__auto.blk.14.ffn_up.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.14.ffn_down.weight = util.global.load @__auto.blk.14.ffn_down.weight : tensor<3200x8640xf16> %136 = torch_c.from_builtin_tensor %__auto.blk.14.ffn_down.weight : tensor<3200x8640xf16> -> !torch.vtensor<[3200,8640],f16> %__auto.blk.15.attn_norm.weight = util.global.load @__auto.blk.15.attn_norm.weight : tensor<3200xf32> %137 = torch_c.from_builtin_tensor %__auto.blk.15.attn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.15.attn_q.weight = util.global.load @__auto.blk.15.attn_q.weight : tensor<3200x3200xf16> %138 = torch_c.from_builtin_tensor %__auto.blk.15.attn_q.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.15.attn_k.weight = util.global.load @__auto.blk.15.attn_k.weight : tensor<3200x3200xf16> %139 = torch_c.from_builtin_tensor %__auto.blk.15.attn_k.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.15.attn_v.weight = util.global.load @__auto.blk.15.attn_v.weight : tensor<3200x3200xf16> %140 = torch_c.from_builtin_tensor %__auto.blk.15.attn_v.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.15.attn_output.weight = util.global.load @__auto.blk.15.attn_output.weight : 
tensor<3200x3200xf16> %141 = torch_c.from_builtin_tensor %__auto.blk.15.attn_output.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.15.ffn_norm.weight = util.global.load @__auto.blk.15.ffn_norm.weight : tensor<3200xf32> %142 = torch_c.from_builtin_tensor %__auto.blk.15.ffn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.15.ffn_gate.weight = util.global.load @__auto.blk.15.ffn_gate.weight : tensor<8640x3200xf16> %143 = torch_c.from_builtin_tensor %__auto.blk.15.ffn_gate.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.15.ffn_up.weight = util.global.load @__auto.blk.15.ffn_up.weight : tensor<8640x3200xf16> %144 = torch_c.from_builtin_tensor %__auto.blk.15.ffn_up.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.15.ffn_down.weight = util.global.load @__auto.blk.15.ffn_down.weight : tensor<3200x8640xf16> %145 = torch_c.from_builtin_tensor %__auto.blk.15.ffn_down.weight : tensor<3200x8640xf16> -> !torch.vtensor<[3200,8640],f16> %__auto.blk.16.attn_norm.weight = util.global.load @__auto.blk.16.attn_norm.weight : tensor<3200xf32> %146 = torch_c.from_builtin_tensor %__auto.blk.16.attn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.16.attn_q.weight = util.global.load @__auto.blk.16.attn_q.weight : tensor<3200x3200xf16> %147 = torch_c.from_builtin_tensor %__auto.blk.16.attn_q.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.16.attn_k.weight = util.global.load @__auto.blk.16.attn_k.weight : tensor<3200x3200xf16> %148 = torch_c.from_builtin_tensor %__auto.blk.16.attn_k.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.16.attn_v.weight = util.global.load @__auto.blk.16.attn_v.weight : tensor<3200x3200xf16> %149 = torch_c.from_builtin_tensor %__auto.blk.16.attn_v.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.16.attn_output.weight = util.global.load 
@__auto.blk.16.attn_output.weight : tensor<3200x3200xf16> %150 = torch_c.from_builtin_tensor %__auto.blk.16.attn_output.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.16.ffn_norm.weight = util.global.load @__auto.blk.16.ffn_norm.weight : tensor<3200xf32> %151 = torch_c.from_builtin_tensor %__auto.blk.16.ffn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.16.ffn_gate.weight = util.global.load @__auto.blk.16.ffn_gate.weight : tensor<8640x3200xf16> %152 = torch_c.from_builtin_tensor %__auto.blk.16.ffn_gate.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.16.ffn_up.weight = util.global.load @__auto.blk.16.ffn_up.weight : tensor<8640x3200xf16> %153 = torch_c.from_builtin_tensor %__auto.blk.16.ffn_up.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.16.ffn_down.weight = util.global.load @__auto.blk.16.ffn_down.weight : tensor<3200x8640xf16> %154 = torch_c.from_builtin_tensor %__auto.blk.16.ffn_down.weight : tensor<3200x8640xf16> -> !torch.vtensor<[3200,8640],f16> %__auto.blk.17.attn_norm.weight = util.global.load @__auto.blk.17.attn_norm.weight : tensor<3200xf32> %155 = torch_c.from_builtin_tensor %__auto.blk.17.attn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.17.attn_q.weight = util.global.load @__auto.blk.17.attn_q.weight : tensor<3200x3200xf16> %156 = torch_c.from_builtin_tensor %__auto.blk.17.attn_q.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.17.attn_k.weight = util.global.load @__auto.blk.17.attn_k.weight : tensor<3200x3200xf16> %157 = torch_c.from_builtin_tensor %__auto.blk.17.attn_k.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.17.attn_v.weight = util.global.load @__auto.blk.17.attn_v.weight : tensor<3200x3200xf16> %158 = torch_c.from_builtin_tensor %__auto.blk.17.attn_v.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> 
%__auto.blk.17.attn_output.weight = util.global.load @__auto.blk.17.attn_output.weight : tensor<3200x3200xf16> %159 = torch_c.from_builtin_tensor %__auto.blk.17.attn_output.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.17.ffn_norm.weight = util.global.load @__auto.blk.17.ffn_norm.weight : tensor<3200xf32> %160 = torch_c.from_builtin_tensor %__auto.blk.17.ffn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.17.ffn_gate.weight = util.global.load @__auto.blk.17.ffn_gate.weight : tensor<8640x3200xf16> %161 = torch_c.from_builtin_tensor %__auto.blk.17.ffn_gate.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.17.ffn_up.weight = util.global.load @__auto.blk.17.ffn_up.weight : tensor<8640x3200xf16> %162 = torch_c.from_builtin_tensor %__auto.blk.17.ffn_up.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.17.ffn_down.weight = util.global.load @__auto.blk.17.ffn_down.weight : tensor<3200x8640xf16> %163 = torch_c.from_builtin_tensor %__auto.blk.17.ffn_down.weight : tensor<3200x8640xf16> -> !torch.vtensor<[3200,8640],f16> %__auto.blk.18.attn_norm.weight = util.global.load @__auto.blk.18.attn_norm.weight : tensor<3200xf32> %164 = torch_c.from_builtin_tensor %__auto.blk.18.attn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.18.attn_q.weight = util.global.load @__auto.blk.18.attn_q.weight : tensor<3200x3200xf16> %165 = torch_c.from_builtin_tensor %__auto.blk.18.attn_q.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.18.attn_k.weight = util.global.load @__auto.blk.18.attn_k.weight : tensor<3200x3200xf16> %166 = torch_c.from_builtin_tensor %__auto.blk.18.attn_k.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.18.attn_v.weight = util.global.load @__auto.blk.18.attn_v.weight : tensor<3200x3200xf16> %167 = torch_c.from_builtin_tensor %__auto.blk.18.attn_v.weight : tensor<3200x3200xf16> -> 
!torch.vtensor<[3200,3200],f16> %__auto.blk.18.attn_output.weight = util.global.load @__auto.blk.18.attn_output.weight : tensor<3200x3200xf16> %168 = torch_c.from_builtin_tensor %__auto.blk.18.attn_output.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.18.ffn_norm.weight = util.global.load @__auto.blk.18.ffn_norm.weight : tensor<3200xf32> %169 = torch_c.from_builtin_tensor %__auto.blk.18.ffn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.18.ffn_gate.weight = util.global.load @__auto.blk.18.ffn_gate.weight : tensor<8640x3200xf16> %170 = torch_c.from_builtin_tensor %__auto.blk.18.ffn_gate.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.18.ffn_up.weight = util.global.load @__auto.blk.18.ffn_up.weight : tensor<8640x3200xf16> %171 = torch_c.from_builtin_tensor %__auto.blk.18.ffn_up.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.18.ffn_down.weight = util.global.load @__auto.blk.18.ffn_down.weight : tensor<3200x8640xf16> %172 = torch_c.from_builtin_tensor %__auto.blk.18.ffn_down.weight : tensor<3200x8640xf16> -> !torch.vtensor<[3200,8640],f16> %__auto.blk.19.attn_norm.weight = util.global.load @__auto.blk.19.attn_norm.weight : tensor<3200xf32> %173 = torch_c.from_builtin_tensor %__auto.blk.19.attn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.19.attn_q.weight = util.global.load @__auto.blk.19.attn_q.weight : tensor<3200x3200xf16> %174 = torch_c.from_builtin_tensor %__auto.blk.19.attn_q.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.19.attn_k.weight = util.global.load @__auto.blk.19.attn_k.weight : tensor<3200x3200xf16> %175 = torch_c.from_builtin_tensor %__auto.blk.19.attn_k.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.19.attn_v.weight = util.global.load @__auto.blk.19.attn_v.weight : tensor<3200x3200xf16> %176 = torch_c.from_builtin_tensor 
%__auto.blk.19.attn_v.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.19.attn_output.weight = util.global.load @__auto.blk.19.attn_output.weight : tensor<3200x3200xf16> %177 = torch_c.from_builtin_tensor %__auto.blk.19.attn_output.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.19.ffn_norm.weight = util.global.load @__auto.blk.19.ffn_norm.weight : tensor<3200xf32> %178 = torch_c.from_builtin_tensor %__auto.blk.19.ffn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.19.ffn_gate.weight = util.global.load @__auto.blk.19.ffn_gate.weight : tensor<8640x3200xf16> %179 = torch_c.from_builtin_tensor %__auto.blk.19.ffn_gate.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.19.ffn_up.weight = util.global.load @__auto.blk.19.ffn_up.weight : tensor<8640x3200xf16> %180 = torch_c.from_builtin_tensor %__auto.blk.19.ffn_up.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.19.ffn_down.weight = util.global.load @__auto.blk.19.ffn_down.weight : tensor<3200x8640xf16> %181 = torch_c.from_builtin_tensor %__auto.blk.19.ffn_down.weight : tensor<3200x8640xf16> -> !torch.vtensor<[3200,8640],f16> %__auto.blk.20.attn_norm.weight = util.global.load @__auto.blk.20.attn_norm.weight : tensor<3200xf32> %182 = torch_c.from_builtin_tensor %__auto.blk.20.attn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.20.attn_q.weight = util.global.load @__auto.blk.20.attn_q.weight : tensor<3200x3200xf16> %183 = torch_c.from_builtin_tensor %__auto.blk.20.attn_q.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.20.attn_k.weight = util.global.load @__auto.blk.20.attn_k.weight : tensor<3200x3200xf16> %184 = torch_c.from_builtin_tensor %__auto.blk.20.attn_k.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.20.attn_v.weight = util.global.load @__auto.blk.20.attn_v.weight : tensor<3200x3200xf16> %185 = 
torch_c.from_builtin_tensor %__auto.blk.20.attn_v.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.20.attn_output.weight = util.global.load @__auto.blk.20.attn_output.weight : tensor<3200x3200xf16> %186 = torch_c.from_builtin_tensor %__auto.blk.20.attn_output.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.20.ffn_norm.weight = util.global.load @__auto.blk.20.ffn_norm.weight : tensor<3200xf32> %187 = torch_c.from_builtin_tensor %__auto.blk.20.ffn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.20.ffn_gate.weight = util.global.load @__auto.blk.20.ffn_gate.weight : tensor<8640x3200xf16> %188 = torch_c.from_builtin_tensor %__auto.blk.20.ffn_gate.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.20.ffn_up.weight = util.global.load @__auto.blk.20.ffn_up.weight : tensor<8640x3200xf16> %189 = torch_c.from_builtin_tensor %__auto.blk.20.ffn_up.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.20.ffn_down.weight = util.global.load @__auto.blk.20.ffn_down.weight : tensor<3200x8640xf16> %190 = torch_c.from_builtin_tensor %__auto.blk.20.ffn_down.weight : tensor<3200x8640xf16> -> !torch.vtensor<[3200,8640],f16> %__auto.blk.21.attn_norm.weight = util.global.load @__auto.blk.21.attn_norm.weight : tensor<3200xf32> %191 = torch_c.from_builtin_tensor %__auto.blk.21.attn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.21.attn_q.weight = util.global.load @__auto.blk.21.attn_q.weight : tensor<3200x3200xf16> %192 = torch_c.from_builtin_tensor %__auto.blk.21.attn_q.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.21.attn_k.weight = util.global.load @__auto.blk.21.attn_k.weight : tensor<3200x3200xf16> %193 = torch_c.from_builtin_tensor %__auto.blk.21.attn_k.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.21.attn_v.weight = util.global.load @__auto.blk.21.attn_v.weight : 
tensor<3200x3200xf16> %194 = torch_c.from_builtin_tensor %__auto.blk.21.attn_v.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.21.attn_output.weight = util.global.load @__auto.blk.21.attn_output.weight : tensor<3200x3200xf16> %195 = torch_c.from_builtin_tensor %__auto.blk.21.attn_output.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.21.ffn_norm.weight = util.global.load @__auto.blk.21.ffn_norm.weight : tensor<3200xf32> %196 = torch_c.from_builtin_tensor %__auto.blk.21.ffn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.21.ffn_gate.weight = util.global.load @__auto.blk.21.ffn_gate.weight : tensor<8640x3200xf16> %197 = torch_c.from_builtin_tensor %__auto.blk.21.ffn_gate.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.21.ffn_up.weight = util.global.load @__auto.blk.21.ffn_up.weight : tensor<8640x3200xf16> %198 = torch_c.from_builtin_tensor %__auto.blk.21.ffn_up.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.21.ffn_down.weight = util.global.load @__auto.blk.21.ffn_down.weight : tensor<3200x8640xf16> %199 = torch_c.from_builtin_tensor %__auto.blk.21.ffn_down.weight : tensor<3200x8640xf16> -> !torch.vtensor<[3200,8640],f16> %__auto.blk.22.attn_norm.weight = util.global.load @__auto.blk.22.attn_norm.weight : tensor<3200xf32> %200 = torch_c.from_builtin_tensor %__auto.blk.22.attn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.22.attn_q.weight = util.global.load @__auto.blk.22.attn_q.weight : tensor<3200x3200xf16> %201 = torch_c.from_builtin_tensor %__auto.blk.22.attn_q.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.22.attn_k.weight = util.global.load @__auto.blk.22.attn_k.weight : tensor<3200x3200xf16> %202 = torch_c.from_builtin_tensor %__auto.blk.22.attn_k.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.22.attn_v.weight = util.global.load 
@__auto.blk.22.attn_v.weight : tensor<3200x3200xf16> %203 = torch_c.from_builtin_tensor %__auto.blk.22.attn_v.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.22.attn_output.weight = util.global.load @__auto.blk.22.attn_output.weight : tensor<3200x3200xf16> %204 = torch_c.from_builtin_tensor %__auto.blk.22.attn_output.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.22.ffn_norm.weight = util.global.load @__auto.blk.22.ffn_norm.weight : tensor<3200xf32> %205 = torch_c.from_builtin_tensor %__auto.blk.22.ffn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.22.ffn_gate.weight = util.global.load @__auto.blk.22.ffn_gate.weight : tensor<8640x3200xf16> %206 = torch_c.from_builtin_tensor %__auto.blk.22.ffn_gate.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.22.ffn_up.weight = util.global.load @__auto.blk.22.ffn_up.weight : tensor<8640x3200xf16> %207 = torch_c.from_builtin_tensor %__auto.blk.22.ffn_up.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.22.ffn_down.weight = util.global.load @__auto.blk.22.ffn_down.weight : tensor<3200x8640xf16> %208 = torch_c.from_builtin_tensor %__auto.blk.22.ffn_down.weight : tensor<3200x8640xf16> -> !torch.vtensor<[3200,8640],f16> %__auto.blk.23.attn_norm.weight = util.global.load @__auto.blk.23.attn_norm.weight : tensor<3200xf32> %209 = torch_c.from_builtin_tensor %__auto.blk.23.attn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.23.attn_q.weight = util.global.load @__auto.blk.23.attn_q.weight : tensor<3200x3200xf16> %210 = torch_c.from_builtin_tensor %__auto.blk.23.attn_q.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.23.attn_k.weight = util.global.load @__auto.blk.23.attn_k.weight : tensor<3200x3200xf16> %211 = torch_c.from_builtin_tensor %__auto.blk.23.attn_k.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> 
%__auto.blk.23.attn_v.weight = util.global.load @__auto.blk.23.attn_v.weight : tensor<3200x3200xf16> %212 = torch_c.from_builtin_tensor %__auto.blk.23.attn_v.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.23.attn_output.weight = util.global.load @__auto.blk.23.attn_output.weight : tensor<3200x3200xf16> %213 = torch_c.from_builtin_tensor %__auto.blk.23.attn_output.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.23.ffn_norm.weight = util.global.load @__auto.blk.23.ffn_norm.weight : tensor<3200xf32> %214 = torch_c.from_builtin_tensor %__auto.blk.23.ffn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.23.ffn_gate.weight = util.global.load @__auto.blk.23.ffn_gate.weight : tensor<8640x3200xf16> %215 = torch_c.from_builtin_tensor %__auto.blk.23.ffn_gate.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.23.ffn_up.weight = util.global.load @__auto.blk.23.ffn_up.weight : tensor<8640x3200xf16> %216 = torch_c.from_builtin_tensor %__auto.blk.23.ffn_up.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.23.ffn_down.weight = util.global.load @__auto.blk.23.ffn_down.weight : tensor<3200x8640xf16> %217 = torch_c.from_builtin_tensor %__auto.blk.23.ffn_down.weight : tensor<3200x8640xf16> -> !torch.vtensor<[3200,8640],f16> %__auto.blk.24.attn_norm.weight = util.global.load @__auto.blk.24.attn_norm.weight : tensor<3200xf32> %218 = torch_c.from_builtin_tensor %__auto.blk.24.attn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.24.attn_q.weight = util.global.load @__auto.blk.24.attn_q.weight : tensor<3200x3200xf16> %219 = torch_c.from_builtin_tensor %__auto.blk.24.attn_q.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.24.attn_k.weight = util.global.load @__auto.blk.24.attn_k.weight : tensor<3200x3200xf16> %220 = torch_c.from_builtin_tensor %__auto.blk.24.attn_k.weight : tensor<3200x3200xf16> -> 
!torch.vtensor<[3200,3200],f16> %__auto.blk.24.attn_v.weight = util.global.load @__auto.blk.24.attn_v.weight : tensor<3200x3200xf16> %221 = torch_c.from_builtin_tensor %__auto.blk.24.attn_v.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.24.attn_output.weight = util.global.load @__auto.blk.24.attn_output.weight : tensor<3200x3200xf16> %222 = torch_c.from_builtin_tensor %__auto.blk.24.attn_output.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.24.ffn_norm.weight = util.global.load @__auto.blk.24.ffn_norm.weight : tensor<3200xf32> %223 = torch_c.from_builtin_tensor %__auto.blk.24.ffn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.24.ffn_gate.weight = util.global.load @__auto.blk.24.ffn_gate.weight : tensor<8640x3200xf16> %224 = torch_c.from_builtin_tensor %__auto.blk.24.ffn_gate.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.24.ffn_up.weight = util.global.load @__auto.blk.24.ffn_up.weight : tensor<8640x3200xf16> %225 = torch_c.from_builtin_tensor %__auto.blk.24.ffn_up.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.24.ffn_down.weight = util.global.load @__auto.blk.24.ffn_down.weight : tensor<3200x8640xf16> %226 = torch_c.from_builtin_tensor %__auto.blk.24.ffn_down.weight : tensor<3200x8640xf16> -> !torch.vtensor<[3200,8640],f16> %__auto.blk.25.attn_norm.weight = util.global.load @__auto.blk.25.attn_norm.weight : tensor<3200xf32> %227 = torch_c.from_builtin_tensor %__auto.blk.25.attn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.25.attn_q.weight = util.global.load @__auto.blk.25.attn_q.weight : tensor<3200x3200xf16> %228 = torch_c.from_builtin_tensor %__auto.blk.25.attn_q.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.25.attn_k.weight = util.global.load @__auto.blk.25.attn_k.weight : tensor<3200x3200xf16> %229 = torch_c.from_builtin_tensor 
%__auto.blk.25.attn_k.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.25.attn_v.weight = util.global.load @__auto.blk.25.attn_v.weight : tensor<3200x3200xf16> %230 = torch_c.from_builtin_tensor %__auto.blk.25.attn_v.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.25.attn_output.weight = util.global.load @__auto.blk.25.attn_output.weight : tensor<3200x3200xf16> %231 = torch_c.from_builtin_tensor %__auto.blk.25.attn_output.weight : tensor<3200x3200xf16> -> !torch.vtensor<[3200,3200],f16> %__auto.blk.25.ffn_norm.weight = util.global.load @__auto.blk.25.ffn_norm.weight : tensor<3200xf32> %232 = torch_c.from_builtin_tensor %__auto.blk.25.ffn_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.blk.25.ffn_gate.weight = util.global.load @__auto.blk.25.ffn_gate.weight : tensor<8640x3200xf16> %233 = torch_c.from_builtin_tensor %__auto.blk.25.ffn_gate.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.25.ffn_up.weight = util.global.load @__auto.blk.25.ffn_up.weight : tensor<8640x3200xf16> %234 = torch_c.from_builtin_tensor %__auto.blk.25.ffn_up.weight : tensor<8640x3200xf16> -> !torch.vtensor<[8640,3200],f16> %__auto.blk.25.ffn_down.weight = util.global.load @__auto.blk.25.ffn_down.weight : tensor<3200x8640xf16> %235 = torch_c.from_builtin_tensor %__auto.blk.25.ffn_down.weight : tensor<3200x8640xf16> -> !torch.vtensor<[3200,8640],f16> %__auto.output_norm.weight = util.global.load @__auto.output_norm.weight : tensor<3200xf32> %236 = torch_c.from_builtin_tensor %__auto.output_norm.weight : tensor<3200xf32> -> !torch.vtensor<[3200],f32> %__auto.output.weight = util.global.load @__auto.output.weight : tensor<32000x3200xf16> %237 = torch_c.from_builtin_tensor %__auto.output.weight : tensor<32000x3200xf16> -> !torch.vtensor<[32000,3200],f16> %238 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %239 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : 
!torch.vtensor<[1],si64> %240 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %241 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %242 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %243 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %244 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %245 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %246 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %247 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %248 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %249 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %250 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %251 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %252 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %253 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %254 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %255 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %256 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %257 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %258 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %259 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %260 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %261 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %262 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %263 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : 
!torch.vtensor<[1],si64> %264 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %265 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %266 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %267 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %268 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %269 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %270 = torch.vtensor.literal(dense<2> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %271 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %272 = torch.vtensor.literal(dense<2> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %273 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %274 = torch.vtensor.literal(dense<2> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %275 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %276 = torch.vtensor.literal(dense<2> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %277 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %278 = torch.vtensor.literal(dense<2> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %279 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %280 = torch.vtensor.literal(dense<2> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %281 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %282 = torch.vtensor.literal(dense<2> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %283 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %284 = torch.vtensor.literal(dense<2> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %285 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %286 = torch.vtensor.literal(dense<3> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %287 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : 
!torch.vtensor<[1],si64> %288 = torch.vtensor.literal(dense<3> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %289 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %290 = torch.vtensor.literal(dense<3> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %291 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %292 = torch.vtensor.literal(dense<3> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %293 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %294 = torch.vtensor.literal(dense<3> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %295 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %296 = torch.vtensor.literal(dense<3> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %297 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %298 = torch.vtensor.literal(dense<3> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %299 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %300 = torch.vtensor.literal(dense<3> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %301 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %302 = torch.vtensor.literal(dense<4> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %303 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %304 = torch.vtensor.literal(dense<4> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %305 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %306 = torch.vtensor.literal(dense<4> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %307 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %308 = torch.vtensor.literal(dense<4> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %309 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %310 = torch.vtensor.literal(dense<4> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %311 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : 
!torch.vtensor<[1],si64> %312 = torch.vtensor.literal(dense<4> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %313 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %314 = torch.vtensor.literal(dense<4> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %315 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %316 = torch.vtensor.literal(dense<4> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %317 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %318 = torch.vtensor.literal(dense<5> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %319 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %320 = torch.vtensor.literal(dense<5> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %321 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %322 = torch.vtensor.literal(dense<5> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %323 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %324 = torch.vtensor.literal(dense<5> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %325 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %326 = torch.vtensor.literal(dense<5> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %327 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %328 = torch.vtensor.literal(dense<5> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %329 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %330 = torch.vtensor.literal(dense<5> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %331 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %332 = torch.vtensor.literal(dense<5> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %333 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %334 = torch.vtensor.literal(dense<6> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %335 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : 
!torch.vtensor<[1],si64> %336 = torch.vtensor.literal(dense<6> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %337 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %338 = torch.vtensor.literal(dense<6> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %339 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %340 = torch.vtensor.literal(dense<6> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %341 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %342 = torch.vtensor.literal(dense<6> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %343 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %344 = torch.vtensor.literal(dense<6> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %345 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %346 = torch.vtensor.literal(dense<6> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %347 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %348 = torch.vtensor.literal(dense<6> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %349 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %350 = torch.vtensor.literal(dense<7> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %351 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %352 = torch.vtensor.literal(dense<7> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %353 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %354 = torch.vtensor.literal(dense<7> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %355 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %356 = torch.vtensor.literal(dense<7> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %357 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %358 = torch.vtensor.literal(dense<7> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %359 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : 
!torch.vtensor<[1],si64> %360 = torch.vtensor.literal(dense<7> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %361 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %362 = torch.vtensor.literal(dense<7> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %363 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %364 = torch.vtensor.literal(dense<7> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %365 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %366 = torch.vtensor.literal(dense<8> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %367 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %368 = torch.vtensor.literal(dense<8> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %369 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %370 = torch.vtensor.literal(dense<8> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %371 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %372 = torch.vtensor.literal(dense<8> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %373 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %374 = torch.vtensor.literal(dense<8> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %375 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %376 = torch.vtensor.literal(dense<8> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %377 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %378 = torch.vtensor.literal(dense<8> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %379 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %380 = torch.vtensor.literal(dense<8> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %381 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %382 = torch.vtensor.literal(dense<9> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %383 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : 
!torch.vtensor<[1],si64> %384 = torch.vtensor.literal(dense<9> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %385 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %386 = torch.vtensor.literal(dense<9> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %387 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %388 = torch.vtensor.literal(dense<9> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %389 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %390 = torch.vtensor.literal(dense<9> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %391 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %392 = torch.vtensor.literal(dense<9> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %393 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %394 = torch.vtensor.literal(dense<9> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %395 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %396 = torch.vtensor.literal(dense<9> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %397 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %398 = torch.vtensor.literal(dense<10> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %399 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %400 = torch.vtensor.literal(dense<10> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %401 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %402 = torch.vtensor.literal(dense<10> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %403 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %404 = torch.vtensor.literal(dense<10> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %405 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %406 = torch.vtensor.literal(dense<10> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %407 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : 
!torch.vtensor<[1],si64> %408 = torch.vtensor.literal(dense<10> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %409 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %410 = torch.vtensor.literal(dense<10> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %411 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %412 = torch.vtensor.literal(dense<10> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %413 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %414 = torch.vtensor.literal(dense<11> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %415 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %416 = torch.vtensor.literal(dense<11> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %417 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %418 = torch.vtensor.literal(dense<11> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %419 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %420 = torch.vtensor.literal(dense<11> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %421 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %422 = torch.vtensor.literal(dense<11> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %423 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %424 = torch.vtensor.literal(dense<11> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %425 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %426 = torch.vtensor.literal(dense<11> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %427 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %428 = torch.vtensor.literal(dense<11> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %429 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %430 = torch.vtensor.literal(dense<12> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %431 = torch.vtensor.literal(dense<0> : 
tensor<1xsi64>) : !torch.vtensor<[1],si64> %432 = torch.vtensor.literal(dense<12> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %433 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %434 = torch.vtensor.literal(dense<12> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %435 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %436 = torch.vtensor.literal(dense<12> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %437 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %438 = torch.vtensor.literal(dense<12> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %439 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %440 = torch.vtensor.literal(dense<12> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %441 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %442 = torch.vtensor.literal(dense<12> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %443 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %444 = torch.vtensor.literal(dense<12> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %445 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %446 = torch.vtensor.literal(dense<13> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %447 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %448 = torch.vtensor.literal(dense<13> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %449 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %450 = torch.vtensor.literal(dense<13> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %451 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %452 = torch.vtensor.literal(dense<13> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %453 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %454 = torch.vtensor.literal(dense<13> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %455 = 
torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %456 = torch.vtensor.literal(dense<13> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %457 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %458 = torch.vtensor.literal(dense<13> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %459 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %460 = torch.vtensor.literal(dense<13> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %461 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %462 = torch.vtensor.literal(dense<14> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %463 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %464 = torch.vtensor.literal(dense<14> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %465 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %466 = torch.vtensor.literal(dense<14> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %467 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %468 = torch.vtensor.literal(dense<14> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %469 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %470 = torch.vtensor.literal(dense<14> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %471 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %472 = torch.vtensor.literal(dense<14> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %473 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %474 = torch.vtensor.literal(dense<14> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %475 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %476 = torch.vtensor.literal(dense<14> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %477 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %478 = torch.vtensor.literal(dense<15> : tensor<1xsi64>) : !torch.vtensor<[1],si64> 
%479 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %480 = torch.vtensor.literal(dense<15> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %481 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %482 = torch.vtensor.literal(dense<15> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %483 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %484 = torch.vtensor.literal(dense<15> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %485 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %486 = torch.vtensor.literal(dense<15> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %487 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %488 = torch.vtensor.literal(dense<15> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %489 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %490 = torch.vtensor.literal(dense<15> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %491 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %492 = torch.vtensor.literal(dense<15> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %493 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %494 = torch.vtensor.literal(dense<16> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %495 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %496 = torch.vtensor.literal(dense<16> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %497 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %498 = torch.vtensor.literal(dense<16> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %499 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %500 = torch.vtensor.literal(dense<16> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %501 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %502 = torch.vtensor.literal(dense<16> : tensor<1xsi64>) : 
!torch.vtensor<[1],si64> %503 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %504 = torch.vtensor.literal(dense<16> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %505 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %506 = torch.vtensor.literal(dense<16> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %507 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %508 = torch.vtensor.literal(dense<16> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %509 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %510 = torch.vtensor.literal(dense<17> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %511 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %512 = torch.vtensor.literal(dense<17> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %513 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %514 = torch.vtensor.literal(dense<17> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %515 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %516 = torch.vtensor.literal(dense<17> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %517 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %518 = torch.vtensor.literal(dense<17> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %519 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %520 = torch.vtensor.literal(dense<17> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %521 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %522 = torch.vtensor.literal(dense<17> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %523 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %524 = torch.vtensor.literal(dense<17> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %525 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %526 = torch.vtensor.literal(dense<18> : 
tensor<1xsi64>) : !torch.vtensor<[1],si64> %527 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %528 = torch.vtensor.literal(dense<18> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %529 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %530 = torch.vtensor.literal(dense<18> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %531 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %532 = torch.vtensor.literal(dense<18> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %533 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %534 = torch.vtensor.literal(dense<18> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %535 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %536 = torch.vtensor.literal(dense<18> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %537 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %538 = torch.vtensor.literal(dense<18> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %539 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %540 = torch.vtensor.literal(dense<18> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %541 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %542 = torch.vtensor.literal(dense<19> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %543 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %544 = torch.vtensor.literal(dense<19> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %545 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %546 = torch.vtensor.literal(dense<19> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %547 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %548 = torch.vtensor.literal(dense<19> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %549 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %550 = 
torch.vtensor.literal(dense<19> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %551 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %552 = torch.vtensor.literal(dense<19> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %553 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %554 = torch.vtensor.literal(dense<19> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %555 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %556 = torch.vtensor.literal(dense<19> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %557 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %558 = torch.vtensor.literal(dense<20> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %559 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %560 = torch.vtensor.literal(dense<20> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %561 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %562 = torch.vtensor.literal(dense<20> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %563 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %564 = torch.vtensor.literal(dense<20> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %565 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %566 = torch.vtensor.literal(dense<20> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %567 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %568 = torch.vtensor.literal(dense<20> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %569 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %570 = torch.vtensor.literal(dense<20> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %571 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %572 = torch.vtensor.literal(dense<20> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %573 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> 
%574 = torch.vtensor.literal(dense<21> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %575 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %576 = torch.vtensor.literal(dense<21> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %577 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %578 = torch.vtensor.literal(dense<21> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %579 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %580 = torch.vtensor.literal(dense<21> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %581 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %582 = torch.vtensor.literal(dense<21> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %583 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %584 = torch.vtensor.literal(dense<21> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %585 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %586 = torch.vtensor.literal(dense<21> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %587 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %588 = torch.vtensor.literal(dense<21> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %589 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %590 = torch.vtensor.literal(dense<22> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %591 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %592 = torch.vtensor.literal(dense<22> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %593 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %594 = torch.vtensor.literal(dense<22> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %595 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %596 = torch.vtensor.literal(dense<22> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %597 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : 
!torch.vtensor<[1],si64> %598 = torch.vtensor.literal(dense<22> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %599 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %600 = torch.vtensor.literal(dense<22> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %601 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %602 = torch.vtensor.literal(dense<22> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %603 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %604 = torch.vtensor.literal(dense<22> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %605 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %606 = torch.vtensor.literal(dense<23> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %607 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %608 = torch.vtensor.literal(dense<23> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %609 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %610 = torch.vtensor.literal(dense<23> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %611 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %612 = torch.vtensor.literal(dense<23> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %613 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %614 = torch.vtensor.literal(dense<23> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %615 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %616 = torch.vtensor.literal(dense<23> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %617 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %618 = torch.vtensor.literal(dense<23> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %619 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %620 = torch.vtensor.literal(dense<23> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %621 = torch.vtensor.literal(dense<1> : 
tensor<1xsi64>) : !torch.vtensor<[1],si64> %622 = torch.vtensor.literal(dense<24> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %623 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %624 = torch.vtensor.literal(dense<24> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %625 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %626 = torch.vtensor.literal(dense<24> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %627 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %628 = torch.vtensor.literal(dense<24> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %629 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %630 = torch.vtensor.literal(dense<24> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %631 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %632 = torch.vtensor.literal(dense<24> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %633 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %634 = torch.vtensor.literal(dense<24> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %635 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %636 = torch.vtensor.literal(dense<24> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %637 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %638 = torch.vtensor.literal(dense<25> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %639 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %640 = torch.vtensor.literal(dense<25> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %641 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %642 = torch.vtensor.literal(dense<25> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %643 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %644 = torch.vtensor.literal(dense<25> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %645 = 
torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %646 = torch.vtensor.literal(dense<25> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %647 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %648 = torch.vtensor.literal(dense<25> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %649 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %650 = torch.vtensor.literal(dense<25> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %651 = torch.vtensor.literal(dense<0> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %652 = torch.vtensor.literal(dense<25> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %653 = torch.vtensor.literal(dense<1> : tensor<1xsi64>) : !torch.vtensor<[1],si64> %654 = torch.copy.to_vtensor %arg4 : !torch.vtensor<[?,2662400],f32> %int1 = torch.constant.int 1 %655 = torch.aten.size.int %arg3, %int1 : !torch.vtensor<[4,?],si64>, !torch.int -> !torch.int %int16 = torch.constant.int 16 %656 = torch.aten.mul.int %655, %int16 : !torch.int, !torch.int -> !torch.int %int0 = torch.constant.int 0 %int1_0 = torch.constant.int 1 %none = torch.constant.none %none_1 = torch.constant.none %cpu = torch.constant.device "cpu" %false = torch.constant.bool false %657 = torch.aten.arange.start_step %int0, %656, %int1_0, %none, %none_1, %cpu, %false : !torch.int, !torch.int, !torch.int, !torch.none, !torch.none, !torch.Device, !torch.bool -> !torch.vtensor<[?],si64> %int-1 = torch.constant.int -1 %658 = torch.aten.unsqueeze %arg1, %int-1 : !torch.vtensor<[4],si64>, !torch.int -> !torch.vtensor<[4,1],si64> %659 = torch.aten.ge.Tensor %657, %658 : !torch.vtensor<[?],si64>, !torch.vtensor<[4,1],si64> -> !torch.vtensor<[4,?],i1> %int6 = torch.constant.int 6 %none_2 = torch.constant.none %none_3 = torch.constant.none %false_4 = torch.constant.bool false %none_5 = torch.constant.none %660 = torch.aten.zeros_like %659, %int6, %none_2, %none_3, %false_4, %none_5 : !torch.vtensor<[4,?],i1>, !torch.int, !torch.none, 
!torch.none, !torch.bool, !torch.none -> !torch.vtensor<[4,?],f32> %float-Inf = torch.constant.float 0xFFF0000000000000 %int6_6 = torch.constant.int 6 %int0_7 = torch.constant.int 0 %cpu_8 = torch.constant.device "cpu" %none_9 = torch.constant.none %661 = torch.aten.scalar_tensor %float-Inf, %int6_6, %int0_7, %cpu_8, %none_9 : !torch.float, !torch.int, !torch.int, !torch.Device, !torch.none -> !torch.vtensor<[],f32> %662 = torch.aten.where.self %659, %661, %660 : !torch.vtensor<[4,?],i1>, !torch.vtensor<[],f32>, !torch.vtensor<[4,?],f32> -> !torch.vtensor<[4,?],f32> %int0_10 = torch.constant.int 0 %int1_11 = torch.constant.int 1 %none_12 = torch.constant.none %none_13 = torch.constant.none %cpu_14 = torch.constant.device "cpu" %false_15 = torch.constant.bool false %663 = torch.aten.arange.start %int0_10, %int1_11, %none_12, %none_13, %cpu_14, %false_15 : !torch.int, !torch.int, !torch.none, !torch.none, !torch.Device, !torch.bool -> !torch.vtensor<[1],si64> %int0_16 = torch.constant.int 0 %664 = torch.aten.unsqueeze %663, %int0_16 : !torch.vtensor<[1],si64>, !torch.int -> !torch.vtensor<[1,1],si64> %int1_17 = torch.constant.int 1 %665 = torch.aten.unsqueeze %arg2, %int1_17 : !torch.vtensor<[4],si64>, !torch.int -> !torch.vtensor<[4,1],si64> %int1_18 = torch.constant.int 1 %666 = torch.aten.add.Tensor %664, %665, %int1_18 : !torch.vtensor<[1,1],si64>, !torch.vtensor<[4,1],si64>, !torch.int -> !torch.vtensor<[4,1],si64> %667 = torch.prim.ListConstruct %666 : (!torch.vtensor<[4,1],si64>) -> !torch.list> %668 = torch.aten.index.Tensor %0, %667 : !torch.vtensor<[2048,50],complex>, !torch.list> -> !torch.vtensor<[4,1,50],complex> %int2 = torch.constant.int 2 %669 = torch.aten.unsqueeze %668, %int2 : !torch.vtensor<[4,1,50],complex>, !torch.int -> !torch.vtensor<[4,1,1,50],complex> %int4 = torch.constant.int 4 %int2048 = torch.constant.int 2048 %int32 = torch.constant.int 32 %int100 = torch.constant.int 100 %670 = torch.prim.ListConstruct %int4, %int2048, %int32, %int100 
: (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %int6_19 = torch.constant.int 6 %none_20 = torch.constant.none %cpu_21 = torch.constant.device "cpu" %false_22 = torch.constant.bool false %none_23 = torch.constant.none %671 = torch.aten.empty.memory_format %670, %int6_19, %none_20, %cpu_21, %false_22, %none_23 : !torch.list, !torch.int, !torch.none, !torch.Device, !torch.bool, !torch.none -> !torch.vtensor<[4,2048,32,100],f32> %int4_24 = torch.constant.int 4 %int2048_25 = torch.constant.int 2048 %int32_26 = torch.constant.int 32 %int100_27 = torch.constant.int 100 %672 = torch.prim.ListConstruct %int4_24, %int2048_25, %int32_26, %int100_27 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %int6_28 = torch.constant.int 6 %none_29 = torch.constant.none %cpu_30 = torch.constant.device "cpu" %false_31 = torch.constant.bool false %none_32 = torch.constant.none %673 = torch.aten.empty.memory_format %672, %int6_28, %none_29, %cpu_30, %false_31, %none_32 : !torch.list, !torch.int, !torch.none, !torch.Device, !torch.bool, !torch.none -> !torch.vtensor<[4,2048,32,100],f32> %int6_33 = torch.constant.int 6 %674 = torch.prims.convert_element_type %1, %int6_33 : !torch.vtensor<[32000,3200],f16>, !torch.int -> !torch.vtensor<[32000,3200],f32> %int-1_34 = torch.constant.int -1 %false_35 = torch.constant.bool false %false_36 = torch.constant.bool false %675 = torch.aten.embedding %674, %arg0, %int-1_34, %false_35, %false_36 : !torch.vtensor<[32000,3200],f32>, !torch.vtensor<[4,1],si64>, !torch.int, !torch.bool, !torch.bool -> !torch.vtensor<[4,1,3200],f32> %int2_37 = torch.constant.int 2 %676 = torch.aten.pow.Tensor_Scalar %675, %int2_37 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_38 = torch.constant.int -1 %677 = torch.prim.ListConstruct %int-1_38 : (!torch.int) -> !torch.list %true = torch.constant.bool true %none_39 = torch.constant.none %678 = torch.aten.mean.dim %676, %677, %true, %none_39 : 
!torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07 = torch.constant.float 9.9999999747524271E-7 %int1_40 = torch.constant.int 1 %679 = torch.aten.add.Scalar %678, %float9.999990e-07, %int1_40 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %680 = torch.aten.rsqrt %679 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %681 = torch.aten.mul.Tensor %675, %680 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %682 = torch.aten.mul.Tensor %681, %2 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %683 = torch_c.to_builtin_tensor %682 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast = tensor.cast %683 : tensor<4x1x3200xf32> to tensor %684 = torch_c.to_builtin_tensor %3 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %685 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast, %684) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_41 = tensor.cast %685 : tensor to tensor<4x1x3200xf32> %686 = torch_c.from_builtin_tensor %cast_41 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %687 = torch_c.to_builtin_tensor %682 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_42 = tensor.cast %687 : tensor<4x1x3200xf32> to tensor %688 = torch_c.to_builtin_tensor %4 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %689 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_42, %688) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_43 = tensor.cast %689 : tensor to tensor<4x1x3200xf32> %690 = torch_c.from_builtin_tensor %cast_43 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %691 = torch_c.to_builtin_tensor %682 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_44 = tensor.cast %691 : tensor<4x1x3200xf32> to tensor %692 = torch_c.to_builtin_tensor %5 : !torch.vtensor<[3200,3200],f16> -> 
tensor<3200x3200xf16> %693 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_44, %692) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_45 = tensor.cast %693 : tensor to tensor<4x1x3200xf32> %694 = torch_c.from_builtin_tensor %cast_45 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int4_46 = torch.constant.int 4 %int1_47 = torch.constant.int 1 %int32_48 = torch.constant.int 32 %int100_49 = torch.constant.int 100 %695 = torch.prim.ListConstruct %int4_46, %int1_47, %int32_48, %int100_49 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %696 = torch.aten.view %686, %695 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_50 = torch.constant.int 4 %int1_51 = torch.constant.int 1 %int32_52 = torch.constant.int 32 %int100_53 = torch.constant.int 100 %697 = torch.prim.ListConstruct %int4_50, %int1_51, %int32_52, %int100_53 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %698 = torch.aten.view %690, %697 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_54 = torch.constant.int 4 %int1_55 = torch.constant.int 1 %int32_56 = torch.constant.int 32 %int100_57 = torch.constant.int 100 %699 = torch.prim.ListConstruct %int4_54, %int1_55, %int32_56, %int100_57 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %700 = torch.aten.view %694, %699 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_58 = torch.constant.int 4 %int1_59 = torch.constant.int 1 %int32_60 = torch.constant.int 32 %int-1_61 = torch.constant.int -1 %int2_62 = torch.constant.int 2 %701 = torch.prim.ListConstruct %int4_58, %int1_59, %int32_60, %int-1_61, %int2_62 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %702 = torch.aten.view %696, %701 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %703 = torch.aten.view_as_complex %702 : !torch.vtensor<[4,1,32,50,2],f32> -> 
!torch.vtensor<[4,1,32,50],complex> %int4_63 = torch.constant.int 4 %int1_64 = torch.constant.int 1 %int32_65 = torch.constant.int 32 %int-1_66 = torch.constant.int -1 %int2_67 = torch.constant.int 2 %704 = torch.prim.ListConstruct %int4_63, %int1_64, %int32_65, %int-1_66, %int2_67 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %705 = torch.aten.view %698, %704 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %706 = torch.aten.view_as_complex %705 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %707 = torch.aten.mul.Tensor %703, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %708 = torch.aten.view_as_real %707 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_68 = torch.constant.int 4 %int1_69 = torch.constant.int 1 %int32_70 = torch.constant.int 32 %int100_71 = torch.constant.int 100 %709 = torch.prim.ListConstruct %int4_68, %int1_69, %int32_70, %int100_71 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %710 = torch.aten.view %708, %709 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %711 = torch.aten.mul.Tensor %706, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %712 = torch.aten.view_as_real %711 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_72 = torch.constant.int 4 %int1_73 = torch.constant.int 1 %int32_74 = torch.constant.int 32 %int100_75 = torch.constant.int 100 %713 = torch.prim.ListConstruct %int4_72, %int1_73, %int32_74, %int100_75 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %714 = torch.aten.view %712, %713 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int1_76 = torch.constant.int 1 %int1_77 = torch.constant.int 1 %715 = 
torch.aten.add.Scalar %arg2, %int1_76, %int1_77 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[4],si64> %int-1_78 = torch.constant.int -1 %int26 = torch.constant.int 26 %int2_79 = torch.constant.int 2 %int16_80 = torch.constant.int 16 %int32_81 = torch.constant.int 32 %int100_82 = torch.constant.int 100 %716 = torch.prim.ListConstruct %int-1_78, %int26, %int2_79, %int16_80, %int32_81, %int100_82 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %717 = torch.aten.view %654, %716 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_83 = torch.constant.int 0 %int0_84 = torch.constant.int 0 %718 = torch.aten.select.int %715, %int0_83, %int0_84 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_85 = torch.constant.int 0 %int0_86 = torch.constant.int 0 %719 = torch.aten.select.int %arg3, %int0_85, %int0_86 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_87 = torch.constant.int 0 %int0_88 = torch.constant.int 0 %int9223372036854775807 = torch.constant.int 9223372036854775807 %int1_89 = torch.constant.int 1 %720 = torch.aten.slice.Tensor %719, %int0_87, %int0_88, %int9223372036854775807, %int1_89 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_90 = torch.constant.int 16 %721 = torch.aten.floor_divide.Scalar %718, %int16_90 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_91 = torch.constant.int 0 %722 = torch.aten.index_select %720, %int0_91, %721 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_92 = torch.constant.int 16 %723 = torch.aten.remainder.Scalar %718, %int16_92 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_93 = torch.constant.none %724 = torch.aten.clone %238, %none_93 : !torch.vtensor<[1],si64>, !torch.none -> 
!torch.vtensor<[1],si64> %none_94 = torch.constant.none %725 = torch.aten.clone %239, %none_94 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_95 = torch.constant.int 0 %726 = torch.aten.unsqueeze %723, %int0_95 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_96 = torch.constant.int 0 %int0_97 = torch.constant.int 0 %727 = torch.aten.select.int %714, %int0_96, %int0_97 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_98 = torch.constant.int 0 %int0_99 = torch.constant.int 0 %728 = torch.aten.select.int %727, %int0_98, %int0_99 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %729 = torch.prim.ListConstruct %722, %724, %725, %726 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_100 = torch.constant.bool false %730 = torch.aten.index_put %717, %729, %728, %false_100 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_101 = torch.constant.int 0 %731 = torch.aten.size.int %654, %int0_101 : !torch.vtensor<[?,2662400],f32>, !torch.int -> !torch.int %int2662400 = torch.constant.int 2662400 %732 = torch.prim.ListConstruct %731, %int2662400 : (!torch.int, !torch.int) -> !torch.list %733 = torch.aten.view %730, %732 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_102 = torch.constant.int -1 %int26_103 = torch.constant.int 26 %int2_104 = torch.constant.int 2 %int16_105 = torch.constant.int 16 %int32_106 = torch.constant.int 32 %int100_107 = torch.constant.int 100 %734 = torch.prim.ListConstruct %int-1_102, %int26_103, %int2_104, %int16_105, %int32_106, %int100_107 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %735 = torch.aten.view %733, %734 : !torch.vtensor<[?,2662400],f32>, 
!torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_108 = torch.constant.none %736 = torch.aten.clone %240, %none_108 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_109 = torch.constant.none %737 = torch.aten.clone %241, %none_109 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_110 = torch.constant.int 0 %738 = torch.aten.unsqueeze %723, %int0_110 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_111 = torch.constant.int 0 %int0_112 = torch.constant.int 0 %739 = torch.aten.select.int %700, %int0_111, %int0_112 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_113 = torch.constant.int 0 %int0_114 = torch.constant.int 0 %740 = torch.aten.select.int %739, %int0_113, %int0_114 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %741 = torch.prim.ListConstruct %722, %736, %737, %738 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_115 = torch.constant.bool false %742 = torch.aten.index_put %735, %741, %740, %false_115 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_116 = torch.constant.int 2662400 %743 = torch.prim.ListConstruct %731, %int2662400_116 : (!torch.int, !torch.int) -> !torch.list %744 = torch.aten.view %742, %743 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_117 = torch.constant.int -1 %int26_118 = torch.constant.int 26 %int2_119 = torch.constant.int 2 %int16_120 = torch.constant.int 16 %int32_121 = torch.constant.int 32 %int100_122 = torch.constant.int 100 %745 = torch.prim.ListConstruct %int-1_117, %int26_118, %int2_119, %int16_120, %int32_121, %int100_122 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %746 = 
torch.aten.view %744, %745 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_123 = torch.constant.int 0 %int1_124 = torch.constant.int 1 %747 = torch.aten.select.int %715, %int0_123, %int1_124 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_125 = torch.constant.int 0 %int1_126 = torch.constant.int 1 %748 = torch.aten.select.int %arg3, %int0_125, %int1_126 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_127 = torch.constant.int 0 %int0_128 = torch.constant.int 0 %int9223372036854775807_129 = torch.constant.int 9223372036854775807 %int1_130 = torch.constant.int 1 %749 = torch.aten.slice.Tensor %748, %int0_127, %int0_128, %int9223372036854775807_129, %int1_130 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_131 = torch.constant.int 16 %750 = torch.aten.floor_divide.Scalar %747, %int16_131 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_132 = torch.constant.int 0 %751 = torch.aten.index_select %749, %int0_132, %750 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_133 = torch.constant.int 16 %752 = torch.aten.remainder.Scalar %747, %int16_133 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_134 = torch.constant.none %753 = torch.aten.clone %242, %none_134 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_135 = torch.constant.none %754 = torch.aten.clone %243, %none_135 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_136 = torch.constant.int 0 %755 = torch.aten.unsqueeze %752, %int0_136 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_137 = torch.constant.int 0 %int1_138 = torch.constant.int 1 %756 = torch.aten.select.int %714, %int0_137, %int1_138 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> 
!torch.vtensor<[1,32,100],f32> %int0_139 = torch.constant.int 0 %int0_140 = torch.constant.int 0 %757 = torch.aten.select.int %756, %int0_139, %int0_140 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %758 = torch.prim.ListConstruct %751, %753, %754, %755 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_141 = torch.constant.bool false %759 = torch.aten.index_put %746, %758, %757, %false_141 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_142 = torch.constant.int 2662400 %760 = torch.prim.ListConstruct %731, %int2662400_142 : (!torch.int, !torch.int) -> !torch.list %761 = torch.aten.view %759, %760 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_143 = torch.constant.int -1 %int26_144 = torch.constant.int 26 %int2_145 = torch.constant.int 2 %int16_146 = torch.constant.int 16 %int32_147 = torch.constant.int 32 %int100_148 = torch.constant.int 100 %762 = torch.prim.ListConstruct %int-1_143, %int26_144, %int2_145, %int16_146, %int32_147, %int100_148 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %763 = torch.aten.view %761, %762 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_149 = torch.constant.none %764 = torch.aten.clone %244, %none_149 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_150 = torch.constant.none %765 = torch.aten.clone %245, %none_150 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_151 = torch.constant.int 0 %766 = torch.aten.unsqueeze %752, %int0_151 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_152 = torch.constant.int 0 %int1_153 = torch.constant.int 1 %767 = torch.aten.select.int %700, %int0_152, %int1_153 : 
!torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_154 = torch.constant.int 0 %int0_155 = torch.constant.int 0 %768 = torch.aten.select.int %767, %int0_154, %int0_155 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %769 = torch.prim.ListConstruct %751, %764, %765, %766 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_156 = torch.constant.bool false %770 = torch.aten.index_put %763, %769, %768, %false_156 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_157 = torch.constant.int 2662400 %771 = torch.prim.ListConstruct %731, %int2662400_157 : (!torch.int, !torch.int) -> !torch.list %772 = torch.aten.view %770, %771 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_158 = torch.constant.int -1 %int26_159 = torch.constant.int 26 %int2_160 = torch.constant.int 2 %int16_161 = torch.constant.int 16 %int32_162 = torch.constant.int 32 %int100_163 = torch.constant.int 100 %773 = torch.prim.ListConstruct %int-1_158, %int26_159, %int2_160, %int16_161, %int32_162, %int100_163 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %774 = torch.aten.view %772, %773 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_164 = torch.constant.int 0 %int2_165 = torch.constant.int 2 %775 = torch.aten.select.int %715, %int0_164, %int2_165 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_166 = torch.constant.int 0 %int2_167 = torch.constant.int 2 %776 = torch.aten.select.int %arg3, %int0_166, %int2_167 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_168 = torch.constant.int 0 %int0_169 = torch.constant.int 0 
%int9223372036854775807_170 = torch.constant.int 9223372036854775807 %int1_171 = torch.constant.int 1 %777 = torch.aten.slice.Tensor %776, %int0_168, %int0_169, %int9223372036854775807_170, %int1_171 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_172 = torch.constant.int 16 %778 = torch.aten.floor_divide.Scalar %775, %int16_172 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_173 = torch.constant.int 0 %779 = torch.aten.index_select %777, %int0_173, %778 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_174 = torch.constant.int 16 %780 = torch.aten.remainder.Scalar %775, %int16_174 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_175 = torch.constant.none %781 = torch.aten.clone %246, %none_175 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_176 = torch.constant.none %782 = torch.aten.clone %247, %none_176 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_177 = torch.constant.int 0 %783 = torch.aten.unsqueeze %780, %int0_177 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_178 = torch.constant.int 0 %int2_179 = torch.constant.int 2 %784 = torch.aten.select.int %714, %int0_178, %int2_179 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_180 = torch.constant.int 0 %int0_181 = torch.constant.int 0 %785 = torch.aten.select.int %784, %int0_180, %int0_181 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %786 = torch.prim.ListConstruct %779, %781, %782, %783 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_182 = torch.constant.bool false %787 = torch.aten.index_put %774, %786, %785, %false_182 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, 
!torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_183 = torch.constant.int 2662400 %788 = torch.prim.ListConstruct %731, %int2662400_183 : (!torch.int, !torch.int) -> !torch.list %789 = torch.aten.view %787, %788 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_184 = torch.constant.int -1 %int26_185 = torch.constant.int 26 %int2_186 = torch.constant.int 2 %int16_187 = torch.constant.int 16 %int32_188 = torch.constant.int 32 %int100_189 = torch.constant.int 100 %790 = torch.prim.ListConstruct %int-1_184, %int26_185, %int2_186, %int16_187, %int32_188, %int100_189 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %791 = torch.aten.view %789, %790 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_190 = torch.constant.none %792 = torch.aten.clone %248, %none_190 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_191 = torch.constant.none %793 = torch.aten.clone %249, %none_191 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_192 = torch.constant.int 0 %794 = torch.aten.unsqueeze %780, %int0_192 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_193 = torch.constant.int 0 %int2_194 = torch.constant.int 2 %795 = torch.aten.select.int %700, %int0_193, %int2_194 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_195 = torch.constant.int 0 %int0_196 = torch.constant.int 0 %796 = torch.aten.select.int %795, %int0_195, %int0_196 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %797 = torch.prim.ListConstruct %779, %792, %793, %794 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_197 = torch.constant.bool false %798 = torch.aten.index_put %791, %797, %796, %false_197 : 
!torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_198 = torch.constant.int 2662400 %799 = torch.prim.ListConstruct %731, %int2662400_198 : (!torch.int, !torch.int) -> !torch.list %800 = torch.aten.view %798, %799 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_199 = torch.constant.int -1 %int26_200 = torch.constant.int 26 %int2_201 = torch.constant.int 2 %int16_202 = torch.constant.int 16 %int32_203 = torch.constant.int 32 %int100_204 = torch.constant.int 100 %801 = torch.prim.ListConstruct %int-1_199, %int26_200, %int2_201, %int16_202, %int32_203, %int100_204 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %802 = torch.aten.view %800, %801 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_205 = torch.constant.int 0 %int3 = torch.constant.int 3 %803 = torch.aten.select.int %715, %int0_205, %int3 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_206 = torch.constant.int 0 %int3_207 = torch.constant.int 3 %804 = torch.aten.select.int %arg3, %int0_206, %int3_207 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_208 = torch.constant.int 0 %int0_209 = torch.constant.int 0 %int9223372036854775807_210 = torch.constant.int 9223372036854775807 %int1_211 = torch.constant.int 1 %805 = torch.aten.slice.Tensor %804, %int0_208, %int0_209, %int9223372036854775807_210, %int1_211 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_212 = torch.constant.int 16 %806 = torch.aten.floor_divide.Scalar %803, %int16_212 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_213 = torch.constant.int 0 %807 = torch.aten.index_select %805, %int0_213, %806 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> 
-> !torch.vtensor<[1],si64> %int16_214 = torch.constant.int 16 %808 = torch.aten.remainder.Scalar %803, %int16_214 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_215 = torch.constant.none %809 = torch.aten.clone %250, %none_215 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_216 = torch.constant.none %810 = torch.aten.clone %251, %none_216 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_217 = torch.constant.int 0 %811 = torch.aten.unsqueeze %808, %int0_217 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_218 = torch.constant.int 0 %int3_219 = torch.constant.int 3 %812 = torch.aten.select.int %714, %int0_218, %int3_219 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_220 = torch.constant.int 0 %int0_221 = torch.constant.int 0 %813 = torch.aten.select.int %812, %int0_220, %int0_221 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %814 = torch.prim.ListConstruct %807, %809, %810, %811 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_222 = torch.constant.bool false %815 = torch.aten.index_put %802, %814, %813, %false_222 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_223 = torch.constant.int 2662400 %816 = torch.prim.ListConstruct %731, %int2662400_223 : (!torch.int, !torch.int) -> !torch.list %817 = torch.aten.view %815, %816 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_224 = torch.constant.int -1 %int26_225 = torch.constant.int 26 %int2_226 = torch.constant.int 2 %int16_227 = torch.constant.int 16 %int32_228 = torch.constant.int 32 %int100_229 = torch.constant.int 100 %818 = torch.prim.ListConstruct %int-1_224, %int26_225, %int2_226, %int16_227, 
%int32_228, %int100_229 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %819 = torch.aten.view %817, %818 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_230 = torch.constant.none %820 = torch.aten.clone %252, %none_230 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_231 = torch.constant.none %821 = torch.aten.clone %253, %none_231 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_232 = torch.constant.int 0 %822 = torch.aten.unsqueeze %808, %int0_232 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_233 = torch.constant.int 0 %int3_234 = torch.constant.int 3 %823 = torch.aten.select.int %700, %int0_233, %int3_234 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_235 = torch.constant.int 0 %int0_236 = torch.constant.int 0 %824 = torch.aten.select.int %823, %int0_235, %int0_236 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %825 = torch.prim.ListConstruct %807, %820, %821, %822 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_237 = torch.constant.bool false %826 = torch.aten.index_put %819, %825, %824, %false_237 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_238 = torch.constant.int 2662400 %827 = torch.prim.ListConstruct %731, %int2662400_238 : (!torch.int, !torch.int) -> !torch.list %828 = torch.aten.view %826, %827 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int0_239 = torch.constant.int 0 %int0_240 = torch.constant.int 0 %int9223372036854775807_241 = torch.constant.int 9223372036854775807 %int1_242 = torch.constant.int 1 %829 = torch.aten.slice.Tensor %671, %int0_239, %int0_240, 
%int9223372036854775807_241, %int1_242 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int16_243 = torch.constant.int 16 %830 = torch.aten.mul.int %655, %int16_243 : !torch.int, !torch.int -> !torch.int %int1_244 = torch.constant.int 1 %int0_245 = torch.constant.int 0 %int1_246 = torch.constant.int 1 %831 = torch.aten.slice.Tensor %829, %int1_244, %int0_245, %830, %int1_246 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int0_247 = torch.constant.int 0 %int0_248 = torch.constant.int 0 %int9223372036854775807_249 = torch.constant.int 9223372036854775807 %int1_250 = torch.constant.int 1 %832 = torch.aten.slice.Tensor %673, %int0_247, %int0_248, %int9223372036854775807_249, %int1_250 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_251 = torch.constant.int 1 %int0_252 = torch.constant.int 0 %int1_253 = torch.constant.int 1 %833 = torch.aten.slice.Tensor %832, %int1_251, %int0_252, %830, %int1_253 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int52 = torch.constant.int 52 %834 = torch.aten.mul.Scalar %arg3, %int52 : !torch.vtensor<[4,?],si64>, !torch.int -> !torch.vtensor<[4,?],si64> %int0_254 = torch.constant.int 0 %int1_255 = torch.constant.int 1 %835 = torch.aten.add.Scalar %834, %int0_254, %int1_255 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_256 = torch.constant.int 4 %836 = torch.aten.mul.int %int4_256, %655 : !torch.int, !torch.int -> !torch.int %837 = torch.prim.ListConstruct %836 : (!torch.int) -> !torch.list %838 = torch.aten.view %835, %837 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int-1_257 = torch.constant.int -1 %int26_258 = torch.constant.int 26 %int2_259 = torch.constant.int 
2 %int16_260 = torch.constant.int 16 %int32_261 = torch.constant.int 32 %int100_262 = torch.constant.int 100 %839 = torch.prim.ListConstruct %int-1_257, %int26_258, %int2_259, %int16_260, %int32_261, %int100_262 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %840 = torch.aten.view %828, %839 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int26_263 = torch.constant.int 26 %841 = torch.aten.mul.int %731, %int26_263 : !torch.int, !torch.int -> !torch.int %int2_264 = torch.constant.int 2 %842 = torch.aten.mul.int %841, %int2_264 : !torch.int, !torch.int -> !torch.int %int16_265 = torch.constant.int 16 %int32_266 = torch.constant.int 32 %int100_267 = torch.constant.int 100 %843 = torch.prim.ListConstruct %842, %int16_265, %int32_266, %int100_267 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %844 = torch.aten.view %840, %843 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,16,32,100],f32> %int0_268 = torch.constant.int 0 %845 = torch.aten.index_select %844, %int0_268, %838 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_269 = torch.constant.int 4 %int16_270 = torch.constant.int 16 %int32_271 = torch.constant.int 32 %int100_272 = torch.constant.int 100 %846 = torch.prim.ListConstruct %int4_269, %655, %int16_270, %int32_271, %int100_272 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %847 = torch.aten.view %845, %846 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_273 = torch.constant.int 1 %848 = torch.aten.size.int %847, %int1_273 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_274 = torch.constant.int 16 %849 = torch.aten.mul.int %848, %int16_274 : !torch.int, !torch.int -> !torch.int %int4_275 = torch.constant.int 4 %int32_276 = torch.constant.int 32 %int100_277 = 
torch.constant.int 100 %850 = torch.prim.ListConstruct %int4_275, %849, %int32_276, %int100_277 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %851 = torch.aten.view %847, %850 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %false_278 = torch.constant.bool false %852 = torch.aten.copy %831, %851, %false_278 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_279 = torch.constant.int 0 %int0_280 = torch.constant.int 0 %int9223372036854775807_281 = torch.constant.int 9223372036854775807 %int1_282 = torch.constant.int 1 %853 = torch.aten.slice.Tensor %671, %int0_279, %int0_280, %int9223372036854775807_281, %int1_282 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_283 = torch.constant.int 1 %int0_284 = torch.constant.int 0 %int1_285 = torch.constant.int 1 %854 = torch.aten.slice_scatter %853, %852, %int1_283, %int0_284, %830, %int1_285 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_286 = torch.constant.int 0 %int0_287 = torch.constant.int 0 %int9223372036854775807_288 = torch.constant.int 9223372036854775807 %int1_289 = torch.constant.int 1 %855 = torch.aten.slice_scatter %671, %854, %int0_286, %int0_287, %int9223372036854775807_288, %int1_289 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_290 = torch.constant.int 1 %int1_291 = torch.constant.int 1 %856 = torch.aten.add.Scalar %835, %int1_290, %int1_291 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_292 = torch.constant.int 4 %857 = torch.aten.mul.int %int4_292, %655 : !torch.int, !torch.int -> !torch.int %858 = 
torch.prim.ListConstruct %857 : (!torch.int) -> !torch.list %859 = torch.aten.view %856, %858 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int0_293 = torch.constant.int 0 %860 = torch.aten.index_select %844, %int0_293, %859 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_294 = torch.constant.int 4 %int16_295 = torch.constant.int 16 %int32_296 = torch.constant.int 32 %int100_297 = torch.constant.int 100 %861 = torch.prim.ListConstruct %int4_294, %655, %int16_295, %int32_296, %int100_297 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %862 = torch.aten.view %860, %861 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_298 = torch.constant.int 1 %863 = torch.aten.size.int %862, %int1_298 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_299 = torch.constant.int 16 %864 = torch.aten.mul.int %863, %int16_299 : !torch.int, !torch.int -> !torch.int %int4_300 = torch.constant.int 4 %int32_301 = torch.constant.int 32 %int100_302 = torch.constant.int 100 %865 = torch.prim.ListConstruct %int4_300, %864, %int32_301, %int100_302 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %866 = torch.aten.view %862, %865 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %false_303 = torch.constant.bool false %867 = torch.aten.copy %833, %866, %false_303 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_304 = torch.constant.int 0 %int0_305 = torch.constant.int 0 %int9223372036854775807_306 = torch.constant.int 9223372036854775807 %int1_307 = torch.constant.int 1 %868 = torch.aten.slice.Tensor %673, %int0_304, %int0_305, %int9223372036854775807_306, %int1_307 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> 
!torch.vtensor<[4,2048,32,100],f32> %int1_308 = torch.constant.int 1 %int0_309 = torch.constant.int 0 %int1_310 = torch.constant.int 1 %869 = torch.aten.slice_scatter %868, %867, %int1_308, %int0_309, %830, %int1_310 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_311 = torch.constant.int 0 %int0_312 = torch.constant.int 0 %int9223372036854775807_313 = torch.constant.int 9223372036854775807 %int1_314 = torch.constant.int 1 %870 = torch.aten.slice_scatter %673, %869, %int0_311, %int0_312, %int9223372036854775807_313, %int1_314 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_315 = torch.constant.int 0 %int0_316 = torch.constant.int 0 %int9223372036854775807_317 = torch.constant.int 9223372036854775807 %int1_318 = torch.constant.int 1 %871 = torch.aten.slice.Tensor %671, %int0_315, %int0_316, %int9223372036854775807_317, %int1_318 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_319 = torch.constant.int 1 %int0_320 = torch.constant.int 0 %int1_321 = torch.constant.int 1 %872 = torch.aten.slice.Tensor %871, %int1_319, %int0_320, %830, %int1_321 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int0_322 = torch.constant.int 0 %int0_323 = torch.constant.int 0 %int9223372036854775807_324 = torch.constant.int 9223372036854775807 %int1_325 = torch.constant.int 1 %873 = torch.aten.slice.Tensor %673, %int0_322, %int0_323, %int9223372036854775807_324, %int1_325 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_326 = torch.constant.int 1 %int0_327 = torch.constant.int 0 %int1_328 = torch.constant.int 1 %874 = 
torch.aten.slice.Tensor %873, %int1_326, %int0_327, %830, %int1_328 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_329 = torch.constant.int 1 %int2_330 = torch.constant.int 2 %875 = torch.aten.transpose.int %710, %int1_329, %int2_330 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,1,100],f32> %int4_331 = torch.constant.int 4 %int32_332 = torch.constant.int 32 %int1_333 = torch.constant.int 1 %int100_334 = torch.constant.int 100 %876 = torch.prim.ListConstruct %int4_331, %int32_332, %int1_333, %int100_334 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_335 = torch.constant.bool false %877 = torch.aten.expand %875, %876, %false_335 : !torch.vtensor<[4,32,1,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,100],f32> %int128 = torch.constant.int 128 %int1_336 = torch.constant.int 1 %int100_337 = torch.constant.int 100 %878 = torch.prim.ListConstruct %int128, %int1_336, %int100_337 : (!torch.int, !torch.int, !torch.int) -> !torch.list %879 = torch.aten.view %877, %878 : !torch.vtensor<[4,32,1,100],f32>, !torch.list -> !torch.vtensor<[128,1,100],f32> %int0_338 = torch.constant.int 0 %int0_339 = torch.constant.int 0 %int9223372036854775807_340 = torch.constant.int 9223372036854775807 %int1_341 = torch.constant.int 1 %880 = torch.aten.slice.Tensor %855, %int0_338, %int0_339, %int9223372036854775807_340, %int1_341 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_342 = torch.constant.int 1 %int0_343 = torch.constant.int 0 %int1_344 = torch.constant.int 1 %881 = torch.aten.slice.Tensor %880, %int1_342, %int0_343, %830, %int1_344 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_345 = torch.constant.int 1 %int2_346 = torch.constant.int 2 %882 = torch.aten.transpose.int 
%881, %int1_345, %int2_346 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int2_347 = torch.constant.int 2 %int3_348 = torch.constant.int 3 %883 = torch.aten.transpose.int %882, %int2_347, %int3_348 : !torch.vtensor<[4,32,?,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int1_349 = torch.constant.int 1 %884 = torch.aten.size.int %872, %int1_349 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_350 = torch.constant.int 4 %int32_351 = torch.constant.int 32 %int100_352 = torch.constant.int 100 %885 = torch.prim.ListConstruct %int4_350, %int32_351, %int100_352, %884 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_353 = torch.constant.bool false %886 = torch.aten.expand %883, %885, %false_353 : !torch.vtensor<[4,32,100,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,100,?],f32> %int0_354 = torch.constant.int 0 %887 = torch.aten.clone %886, %int0_354 : !torch.vtensor<[4,32,100,?],f32>, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int128_355 = torch.constant.int 128 %int100_356 = torch.constant.int 100 %888 = torch.prim.ListConstruct %int128_355, %int100_356, %884 : (!torch.int, !torch.int, !torch.int) -> !torch.list %889 = torch.aten._unsafe_view %887, %888 : !torch.vtensor<[4,32,100,?],f32>, !torch.list -> !torch.vtensor<[128,100,?],f32> %890 = torch.aten.bmm %879, %889 : !torch.vtensor<[128,1,100],f32>, !torch.vtensor<[128,100,?],f32> -> !torch.vtensor<[128,1,?],f32> %int4_357 = torch.constant.int 4 %int32_358 = torch.constant.int 32 %int1_359 = torch.constant.int 1 %891 = torch.prim.ListConstruct %int4_357, %int32_358, %int1_359, %884 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %892 = torch.aten.view %890, %891 : !torch.vtensor<[128,1,?],f32>, !torch.list -> !torch.vtensor<[4,32,1,?],f32> %float1.000000e01 = torch.constant.float 1.000000e+01 %893 = torch.aten.div.Scalar %892, %float1.000000e01 : 
!torch.vtensor<[4,32,1,?],f32>, !torch.float -> !torch.vtensor<[4,32,1,?],f32> %int1_360 = torch.constant.int 1 %894 = torch.aten.unsqueeze %662, %int1_360 : !torch.vtensor<[4,?],f32>, !torch.int -> !torch.vtensor<[4,1,?],f32> %int1_361 = torch.constant.int 1 %895 = torch.aten.unsqueeze %894, %int1_361 : !torch.vtensor<[4,1,?],f32>, !torch.int -> !torch.vtensor<[4,1,1,?],f32> %int1_362 = torch.constant.int 1 %896 = torch.aten.add.Tensor %893, %895, %int1_362 : !torch.vtensor<[4,32,1,?],f32>, !torch.vtensor<[4,1,1,?],f32>, !torch.int -> !torch.vtensor<[4,32,1,?],f32> %int-1_363 = torch.constant.int -1 %false_364 = torch.constant.bool false %897 = torch.aten._softmax %896, %int-1_363, %false_364 : !torch.vtensor<[4,32,1,?],f32>, !torch.int, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int4_365 = torch.constant.int 4 %int32_366 = torch.constant.int 32 %int1_367 = torch.constant.int 1 %898 = torch.prim.ListConstruct %int4_365, %int32_366, %int1_367, %884 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_368 = torch.constant.bool false %899 = torch.aten.expand %897, %898, %false_368 : !torch.vtensor<[4,32,1,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int128_369 = torch.constant.int 128 %int1_370 = torch.constant.int 1 %900 = torch.prim.ListConstruct %int128_369, %int1_370, %884 : (!torch.int, !torch.int, !torch.int) -> !torch.list %901 = torch.aten.view %899, %900 : !torch.vtensor<[4,32,1,?],f32>, !torch.list -> !torch.vtensor<[128,1,?],f32> %int0_371 = torch.constant.int 0 %int0_372 = torch.constant.int 0 %int9223372036854775807_373 = torch.constant.int 9223372036854775807 %int1_374 = torch.constant.int 1 %902 = torch.aten.slice.Tensor %870, %int0_371, %int0_372, %int9223372036854775807_373, %int1_374 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_375 = torch.constant.int 1 %int0_376 = torch.constant.int 0 %int1_377 = torch.constant.int 
1 %903 = torch.aten.slice.Tensor %902, %int1_375, %int0_376, %830, %int1_377 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_378 = torch.constant.int 1 %int2_379 = torch.constant.int 2 %904 = torch.aten.transpose.int %903, %int1_378, %int2_379 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int1_380 = torch.constant.int 1 %905 = torch.aten.size.int %874, %int1_380 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_381 = torch.constant.int 4 %int32_382 = torch.constant.int 32 %int100_383 = torch.constant.int 100 %906 = torch.prim.ListConstruct %int4_381, %int32_382, %905, %int100_383 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_384 = torch.constant.bool false %907 = torch.aten.expand %904, %906, %false_384 : !torch.vtensor<[4,32,?,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,?,100],f32> %int0_385 = torch.constant.int 0 %908 = torch.aten.clone %907, %int0_385 : !torch.vtensor<[4,32,?,100],f32>, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int128_386 = torch.constant.int 128 %int100_387 = torch.constant.int 100 %909 = torch.prim.ListConstruct %int128_386, %905, %int100_387 : (!torch.int, !torch.int, !torch.int) -> !torch.list %910 = torch.aten._unsafe_view %908, %909 : !torch.vtensor<[4,32,?,100],f32>, !torch.list -> !torch.vtensor<[128,?,100],f32> %911 = torch.aten.bmm %901, %910 : !torch.vtensor<[128,1,?],f32>, !torch.vtensor<[128,?,100],f32> -> !torch.vtensor<[128,1,100],f32> %int4_388 = torch.constant.int 4 %int32_389 = torch.constant.int 32 %int1_390 = torch.constant.int 1 %int100_391 = torch.constant.int 100 %912 = torch.prim.ListConstruct %int4_388, %int32_389, %int1_390, %int100_391 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %913 = torch.aten.view %911, %912 : !torch.vtensor<[128,1,100],f32>, !torch.list -> !torch.vtensor<[4,32,1,100],f32> %int1_392 = 
torch.constant.int 1 %int2_393 = torch.constant.int 2 %914 = torch.aten.transpose.int %913, %int1_392, %int2_393 : !torch.vtensor<[4,32,1,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,1,32,100],f32> %int4_394 = torch.constant.int 4 %int1_395 = torch.constant.int 1 %int-1_396 = torch.constant.int -1 %915 = torch.prim.ListConstruct %int4_394, %int1_395, %int-1_396 : (!torch.int, !torch.int, !torch.int) -> !torch.list %916 = torch.aten.view %914, %915 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,3200],f32> %917 = torch_c.to_builtin_tensor %916 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_397 = tensor.cast %917 : tensor<4x1x3200xf32> to tensor %918 = torch_c.to_builtin_tensor %6 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %919 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_397, %918) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_398 = tensor.cast %919 : tensor to tensor<4x1x3200xf32> %920 = torch_c.from_builtin_tensor %cast_398 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int1_399 = torch.constant.int 1 %921 = torch.aten.add.Tensor %675, %920, %int1_399 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_400 = torch.constant.int 2 %922 = torch.aten.pow.Tensor_Scalar %921, %int2_400 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_401 = torch.constant.int -1 %923 = torch.prim.ListConstruct %int-1_401 : (!torch.int) -> !torch.list %true_402 = torch.constant.bool true %none_403 = torch.constant.none %924 = torch.aten.mean.dim %922, %923, %true_402, %none_403 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_404 = torch.constant.float 9.9999999747524271E-7 %int1_405 = torch.constant.int 1 %925 = torch.aten.add.Scalar %924, %float9.999990e-07_404, %int1_405 : !torch.vtensor<[4,1,1],f32>, !torch.float, 
!torch.int -> !torch.vtensor<[4,1,1],f32> %926 = torch.aten.rsqrt %925 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %927 = torch.aten.mul.Tensor %921, %926 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %928 = torch.aten.mul.Tensor %927, %7 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %929 = torch_c.to_builtin_tensor %928 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_406 = tensor.cast %929 : tensor<4x1x3200xf32> to tensor %930 = torch_c.to_builtin_tensor %8 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %931 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_406, %930) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_407 = tensor.cast %931 : tensor to tensor<4x1x8640xf32> %932 = torch_c.from_builtin_tensor %cast_407 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %933 = torch.aten.silu %932 : !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32> %934 = torch_c.to_builtin_tensor %928 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_408 = tensor.cast %934 : tensor<4x1x3200xf32> to tensor %935 = torch_c.to_builtin_tensor %9 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %936 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_408, %935) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_409 = tensor.cast %936 : tensor to tensor<4x1x8640xf32> %937 = torch_c.from_builtin_tensor %cast_409 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %938 = torch.aten.mul.Tensor %933, %937 : !torch.vtensor<[4,1,8640],f32>, !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32> %939 = torch_c.to_builtin_tensor %938 : !torch.vtensor<[4,1,8640],f32> -> tensor<4x1x8640xf32> %cast_410 = tensor.cast %939 : tensor<4x1x8640xf32> to tensor %940 = torch_c.to_builtin_tensor %10 : !torch.vtensor<[3200,8640],f16> -> tensor<3200x8640xf16> %941 = util.call 
@sharktank_mmtfp_3d_3200_8640_f32f16f32(%cast_410, %940) : (tensor, tensor<3200x8640xf16>) -> tensor %cast_411 = tensor.cast %941 : tensor to tensor<4x1x3200xf32> %942 = torch_c.from_builtin_tensor %cast_411 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int1_412 = torch.constant.int 1 %943 = torch.aten.add.Tensor %921, %942, %int1_412 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_413 = torch.constant.int 2 %944 = torch.aten.pow.Tensor_Scalar %943, %int2_413 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_414 = torch.constant.int -1 %945 = torch.prim.ListConstruct %int-1_414 : (!torch.int) -> !torch.list %true_415 = torch.constant.bool true %none_416 = torch.constant.none %946 = torch.aten.mean.dim %944, %945, %true_415, %none_416 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_417 = torch.constant.float 9.9999999747524271E-7 %int1_418 = torch.constant.int 1 %947 = torch.aten.add.Scalar %946, %float9.999990e-07_417, %int1_418 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %948 = torch.aten.rsqrt %947 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %949 = torch.aten.mul.Tensor %943, %948 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %950 = torch.aten.mul.Tensor %949, %11 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %951 = torch_c.to_builtin_tensor %950 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_419 = tensor.cast %951 : tensor<4x1x3200xf32> to tensor %952 = torch_c.to_builtin_tensor %12 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %953 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_419, %952) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_420 = tensor.cast %953 : tensor to 
tensor<4x1x3200xf32> %954 = torch_c.from_builtin_tensor %cast_420 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %955 = torch_c.to_builtin_tensor %950 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_421 = tensor.cast %955 : tensor<4x1x3200xf32> to tensor %956 = torch_c.to_builtin_tensor %13 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %957 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_421, %956) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_422 = tensor.cast %957 : tensor to tensor<4x1x3200xf32> %958 = torch_c.from_builtin_tensor %cast_422 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %959 = torch_c.to_builtin_tensor %950 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_423 = tensor.cast %959 : tensor<4x1x3200xf32> to tensor %960 = torch_c.to_builtin_tensor %14 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %961 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_423, %960) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_424 = tensor.cast %961 : tensor to tensor<4x1x3200xf32> %962 = torch_c.from_builtin_tensor %cast_424 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int4_425 = torch.constant.int 4 %int1_426 = torch.constant.int 1 %int32_427 = torch.constant.int 32 %int100_428 = torch.constant.int 100 %963 = torch.prim.ListConstruct %int4_425, %int1_426, %int32_427, %int100_428 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %964 = torch.aten.view %954, %963 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_429 = torch.constant.int 4 %int1_430 = torch.constant.int 1 %int32_431 = torch.constant.int 32 %int100_432 = torch.constant.int 100 %965 = torch.prim.ListConstruct %int4_429, %int1_430, %int32_431, %int100_432 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %966 = torch.aten.view %958, %965 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_433 
= torch.constant.int 4 %int1_434 = torch.constant.int 1 %int32_435 = torch.constant.int 32 %int100_436 = torch.constant.int 100 %967 = torch.prim.ListConstruct %int4_433, %int1_434, %int32_435, %int100_436 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %968 = torch.aten.view %962, %967 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_437 = torch.constant.int 4 %int1_438 = torch.constant.int 1 %int32_439 = torch.constant.int 32 %int-1_440 = torch.constant.int -1 %int2_441 = torch.constant.int 2 %969 = torch.prim.ListConstruct %int4_437, %int1_438, %int32_439, %int-1_440, %int2_441 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %970 = torch.aten.view %964, %969 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %971 = torch.aten.view_as_complex %970 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %int4_442 = torch.constant.int 4 %int1_443 = torch.constant.int 1 %int32_444 = torch.constant.int 32 %int-1_445 = torch.constant.int -1 %int2_446 = torch.constant.int 2 %972 = torch.prim.ListConstruct %int4_442, %int1_443, %int32_444, %int-1_445, %int2_446 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %973 = torch.aten.view %966, %972 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %974 = torch.aten.view_as_complex %973 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %975 = torch.aten.mul.Tensor %971, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %976 = torch.aten.view_as_real %975 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_447 = torch.constant.int 4 %int1_448 = torch.constant.int 1 %int32_449 = torch.constant.int 32 %int100_450 = torch.constant.int 100 %977 = torch.prim.ListConstruct %int4_447, %int1_448, %int32_449, 
%int100_450 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %978 = torch.aten.view %976, %977 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %979 = torch.aten.mul.Tensor %974, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %980 = torch.aten.view_as_real %979 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_451 = torch.constant.int 4 %int1_452 = torch.constant.int 1 %int32_453 = torch.constant.int 32 %int100_454 = torch.constant.int 100 %981 = torch.prim.ListConstruct %int4_451, %int1_452, %int32_453, %int100_454 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %982 = torch.aten.view %980, %981 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int1_455 = torch.constant.int 1 %int1_456 = torch.constant.int 1 %983 = torch.aten.add.Scalar %arg2, %int1_455, %int1_456 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[4],si64> %int0_457 = torch.constant.int 0 %int0_458 = torch.constant.int 0 %984 = torch.aten.select.int %983, %int0_457, %int0_458 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_459 = torch.constant.int 0 %int0_460 = torch.constant.int 0 %985 = torch.aten.select.int %arg3, %int0_459, %int0_460 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_461 = torch.constant.int 0 %int0_462 = torch.constant.int 0 %int9223372036854775807_463 = torch.constant.int 9223372036854775807 %int1_464 = torch.constant.int 1 %986 = torch.aten.slice.Tensor %985, %int0_461, %int0_462, %int9223372036854775807_463, %int1_464 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_465 = torch.constant.int 16 %987 = torch.aten.floor_divide.Scalar %984, %int16_465 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> 
%int0_466 = torch.constant.int 0 %988 = torch.aten.index_select %986, %int0_466, %987 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_467 = torch.constant.int 16 %989 = torch.aten.remainder.Scalar %984, %int16_467 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_468 = torch.constant.none %990 = torch.aten.clone %254, %none_468 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_469 = torch.constant.none %991 = torch.aten.clone %255, %none_469 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_470 = torch.constant.int 0 %992 = torch.aten.unsqueeze %989, %int0_470 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_471 = torch.constant.int 0 %int0_472 = torch.constant.int 0 %993 = torch.aten.select.int %982, %int0_471, %int0_472 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_473 = torch.constant.int 0 %int0_474 = torch.constant.int 0 %994 = torch.aten.select.int %993, %int0_473, %int0_474 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %int-1_475 = torch.constant.int -1 %int26_476 = torch.constant.int 26 %int2_477 = torch.constant.int 2 %int16_478 = torch.constant.int 16 %int32_479 = torch.constant.int 32 %int100_480 = torch.constant.int 100 %995 = torch.prim.ListConstruct %int-1_475, %int26_476, %int2_477, %int16_478, %int32_479, %int100_480 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %996 = torch.aten.view %828, %995 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %997 = torch.prim.ListConstruct %988, %990, %991, %992 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_481 = torch.constant.bool false %998 = torch.aten.index_put %996, %997, %994, %false_481 : 
!torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_482 = torch.constant.int 2662400 %999 = torch.prim.ListConstruct %731, %int2662400_482 : (!torch.int, !torch.int) -> !torch.list %1000 = torch.aten.view %998, %999 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_483 = torch.constant.int -1 %int26_484 = torch.constant.int 26 %int2_485 = torch.constant.int 2 %int16_486 = torch.constant.int 16 %int32_487 = torch.constant.int 32 %int100_488 = torch.constant.int 100 %1001 = torch.prim.ListConstruct %int-1_483, %int26_484, %int2_485, %int16_486, %int32_487, %int100_488 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1002 = torch.aten.view %1000, %1001 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_489 = torch.constant.none %1003 = torch.aten.clone %256, %none_489 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_490 = torch.constant.none %1004 = torch.aten.clone %257, %none_490 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_491 = torch.constant.int 0 %1005 = torch.aten.unsqueeze %989, %int0_491 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_492 = torch.constant.int 0 %int0_493 = torch.constant.int 0 %1006 = torch.aten.select.int %968, %int0_492, %int0_493 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_494 = torch.constant.int 0 %int0_495 = torch.constant.int 0 %1007 = torch.aten.select.int %1006, %int0_494, %int0_495 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %1008 = torch.prim.ListConstruct %988, %1003, %1004, %1005 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_496 = 
torch.constant.bool false %1009 = torch.aten.index_put %1002, %1008, %1007, %false_496 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_497 = torch.constant.int 2662400 %1010 = torch.prim.ListConstruct %731, %int2662400_497 : (!torch.int, !torch.int) -> !torch.list %1011 = torch.aten.view %1009, %1010 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_498 = torch.constant.int -1 %int26_499 = torch.constant.int 26 %int2_500 = torch.constant.int 2 %int16_501 = torch.constant.int 16 %int32_502 = torch.constant.int 32 %int100_503 = torch.constant.int 100 %1012 = torch.prim.ListConstruct %int-1_498, %int26_499, %int2_500, %int16_501, %int32_502, %int100_503 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1013 = torch.aten.view %1011, %1012 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_504 = torch.constant.int 0 %int1_505 = torch.constant.int 1 %1014 = torch.aten.select.int %983, %int0_504, %int1_505 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_506 = torch.constant.int 0 %int1_507 = torch.constant.int 1 %1015 = torch.aten.select.int %arg3, %int0_506, %int1_507 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_508 = torch.constant.int 0 %int0_509 = torch.constant.int 0 %int9223372036854775807_510 = torch.constant.int 9223372036854775807 %int1_511 = torch.constant.int 1 %1016 = torch.aten.slice.Tensor %1015, %int0_508, %int0_509, %int9223372036854775807_510, %int1_511 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_512 = torch.constant.int 16 %1017 = torch.aten.floor_divide.Scalar %1014, %int16_512 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_513 = torch.constant.int 0 %1018 = 
torch.aten.index_select %1016, %int0_513, %1017 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_514 = torch.constant.int 16 %1019 = torch.aten.remainder.Scalar %1014, %int16_514 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_515 = torch.constant.none %1020 = torch.aten.clone %258, %none_515 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_516 = torch.constant.none %1021 = torch.aten.clone %259, %none_516 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_517 = torch.constant.int 0 %1022 = torch.aten.unsqueeze %1019, %int0_517 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_518 = torch.constant.int 0 %int1_519 = torch.constant.int 1 %1023 = torch.aten.select.int %982, %int0_518, %int1_519 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_520 = torch.constant.int 0 %int0_521 = torch.constant.int 0 %1024 = torch.aten.select.int %1023, %int0_520, %int0_521 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %1025 = torch.prim.ListConstruct %1018, %1020, %1021, %1022 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_522 = torch.constant.bool false %1026 = torch.aten.index_put %1013, %1025, %1024, %false_522 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_523 = torch.constant.int 2662400 %1027 = torch.prim.ListConstruct %731, %int2662400_523 : (!torch.int, !torch.int) -> !torch.list %1028 = torch.aten.view %1026, %1027 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_524 = torch.constant.int -1 %int26_525 = torch.constant.int 26 %int2_526 = torch.constant.int 2 %int16_527 = torch.constant.int 16 %int32_528 = 
torch.constant.int 32 %int100_529 = torch.constant.int 100 %1029 = torch.prim.ListConstruct %int-1_524, %int26_525, %int2_526, %int16_527, %int32_528, %int100_529 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1030 = torch.aten.view %1028, %1029 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_530 = torch.constant.none %1031 = torch.aten.clone %260, %none_530 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_531 = torch.constant.none %1032 = torch.aten.clone %261, %none_531 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_532 = torch.constant.int 0 %1033 = torch.aten.unsqueeze %1019, %int0_532 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_533 = torch.constant.int 0 %int1_534 = torch.constant.int 1 %1034 = torch.aten.select.int %968, %int0_533, %int1_534 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_535 = torch.constant.int 0 %int0_536 = torch.constant.int 0 %1035 = torch.aten.select.int %1034, %int0_535, %int0_536 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %1036 = torch.prim.ListConstruct %1018, %1031, %1032, %1033 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_537 = torch.constant.bool false %1037 = torch.aten.index_put %1030, %1036, %1035, %false_537 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_538 = torch.constant.int 2662400 %1038 = torch.prim.ListConstruct %731, %int2662400_538 : (!torch.int, !torch.int) -> !torch.list %1039 = torch.aten.view %1037, %1038 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_539 = torch.constant.int -1 %int26_540 = torch.constant.int 26 
%int2_541 = torch.constant.int 2 %int16_542 = torch.constant.int 16 %int32_543 = torch.constant.int 32 %int100_544 = torch.constant.int 100 %1040 = torch.prim.ListConstruct %int-1_539, %int26_540, %int2_541, %int16_542, %int32_543, %int100_544 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1041 = torch.aten.view %1039, %1040 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_545 = torch.constant.int 0 %int2_546 = torch.constant.int 2 %1042 = torch.aten.select.int %983, %int0_545, %int2_546 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_547 = torch.constant.int 0 %int2_548 = torch.constant.int 2 %1043 = torch.aten.select.int %arg3, %int0_547, %int2_548 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_549 = torch.constant.int 0 %int0_550 = torch.constant.int 0 %int9223372036854775807_551 = torch.constant.int 9223372036854775807 %int1_552 = torch.constant.int 1 %1044 = torch.aten.slice.Tensor %1043, %int0_549, %int0_550, %int9223372036854775807_551, %int1_552 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_553 = torch.constant.int 16 %1045 = torch.aten.floor_divide.Scalar %1042, %int16_553 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_554 = torch.constant.int 0 %1046 = torch.aten.index_select %1044, %int0_554, %1045 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_555 = torch.constant.int 16 %1047 = torch.aten.remainder.Scalar %1042, %int16_555 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_556 = torch.constant.none %1048 = torch.aten.clone %262, %none_556 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_557 = torch.constant.none %1049 = torch.aten.clone %263, %none_557 : !torch.vtensor<[1],si64>, !torch.none -> 
!torch.vtensor<[1],si64> %int0_558 = torch.constant.int 0 %1050 = torch.aten.unsqueeze %1047, %int0_558 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_559 = torch.constant.int 0 %int2_560 = torch.constant.int 2 %1051 = torch.aten.select.int %982, %int0_559, %int2_560 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_561 = torch.constant.int 0 %int0_562 = torch.constant.int 0 %1052 = torch.aten.select.int %1051, %int0_561, %int0_562 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %1053 = torch.prim.ListConstruct %1046, %1048, %1049, %1050 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_563 = torch.constant.bool false %1054 = torch.aten.index_put %1041, %1053, %1052, %false_563 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_564 = torch.constant.int 2662400 %1055 = torch.prim.ListConstruct %731, %int2662400_564 : (!torch.int, !torch.int) -> !torch.list %1056 = torch.aten.view %1054, %1055 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_565 = torch.constant.int -1 %int26_566 = torch.constant.int 26 %int2_567 = torch.constant.int 2 %int16_568 = torch.constant.int 16 %int32_569 = torch.constant.int 32 %int100_570 = torch.constant.int 100 %1057 = torch.prim.ListConstruct %int-1_565, %int26_566, %int2_567, %int16_568, %int32_569, %int100_570 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1058 = torch.aten.view %1056, %1057 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_571 = torch.constant.none %1059 = torch.aten.clone %264, %none_571 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_572 = torch.constant.none %1060 
= torch.aten.clone %265, %none_572 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_573 = torch.constant.int 0 %1061 = torch.aten.unsqueeze %1047, %int0_573 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_574 = torch.constant.int 0 %int2_575 = torch.constant.int 2 %1062 = torch.aten.select.int %968, %int0_574, %int2_575 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_576 = torch.constant.int 0 %int0_577 = torch.constant.int 0 %1063 = torch.aten.select.int %1062, %int0_576, %int0_577 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %1064 = torch.prim.ListConstruct %1046, %1059, %1060, %1061 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_578 = torch.constant.bool false %1065 = torch.aten.index_put %1058, %1064, %1063, %false_578 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_579 = torch.constant.int 2662400 %1066 = torch.prim.ListConstruct %731, %int2662400_579 : (!torch.int, !torch.int) -> !torch.list %1067 = torch.aten.view %1065, %1066 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_580 = torch.constant.int -1 %int26_581 = torch.constant.int 26 %int2_582 = torch.constant.int 2 %int16_583 = torch.constant.int 16 %int32_584 = torch.constant.int 32 %int100_585 = torch.constant.int 100 %1068 = torch.prim.ListConstruct %int-1_580, %int26_581, %int2_582, %int16_583, %int32_584, %int100_585 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1069 = torch.aten.view %1067, %1068 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_586 = torch.constant.int 0 %int3_587 = torch.constant.int 3 %1070 = torch.aten.select.int %983, 
%int0_586, %int3_587 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_588 = torch.constant.int 0 %int3_589 = torch.constant.int 3 %1071 = torch.aten.select.int %arg3, %int0_588, %int3_589 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_590 = torch.constant.int 0 %int0_591 = torch.constant.int 0 %int9223372036854775807_592 = torch.constant.int 9223372036854775807 %int1_593 = torch.constant.int 1 %1072 = torch.aten.slice.Tensor %1071, %int0_590, %int0_591, %int9223372036854775807_592, %int1_593 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_594 = torch.constant.int 16 %1073 = torch.aten.floor_divide.Scalar %1070, %int16_594 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_595 = torch.constant.int 0 %1074 = torch.aten.index_select %1072, %int0_595, %1073 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_596 = torch.constant.int 16 %1075 = torch.aten.remainder.Scalar %1070, %int16_596 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_597 = torch.constant.none %1076 = torch.aten.clone %266, %none_597 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_598 = torch.constant.none %1077 = torch.aten.clone %267, %none_598 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_599 = torch.constant.int 0 %1078 = torch.aten.unsqueeze %1075, %int0_599 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_600 = torch.constant.int 0 %int3_601 = torch.constant.int 3 %1079 = torch.aten.select.int %982, %int0_600, %int3_601 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_602 = torch.constant.int 0 %int0_603 = torch.constant.int 0 %1080 = torch.aten.select.int %1079, %int0_602, %int0_603 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> 
!torch.vtensor<[32,100],f32> %1081 = torch.prim.ListConstruct %1074, %1076, %1077, %1078 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_604 = torch.constant.bool false %1082 = torch.aten.index_put %1069, %1081, %1080, %false_604 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_605 = torch.constant.int 2662400 %1083 = torch.prim.ListConstruct %731, %int2662400_605 : (!torch.int, !torch.int) -> !torch.list %1084 = torch.aten.view %1082, %1083 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_606 = torch.constant.int -1 %int26_607 = torch.constant.int 26 %int2_608 = torch.constant.int 2 %int16_609 = torch.constant.int 16 %int32_610 = torch.constant.int 32 %int100_611 = torch.constant.int 100 %1085 = torch.prim.ListConstruct %int-1_606, %int26_607, %int2_608, %int16_609, %int32_610, %int100_611 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1086 = torch.aten.view %1084, %1085 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_612 = torch.constant.none %1087 = torch.aten.clone %268, %none_612 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_613 = torch.constant.none %1088 = torch.aten.clone %269, %none_613 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_614 = torch.constant.int 0 %1089 = torch.aten.unsqueeze %1075, %int0_614 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_615 = torch.constant.int 0 %int3_616 = torch.constant.int 3 %1090 = torch.aten.select.int %968, %int0_615, %int3_616 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_617 = torch.constant.int 0 %int0_618 = torch.constant.int 0 %1091 = torch.aten.select.int %1090, 
%int0_617, %int0_618 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %1092 = torch.prim.ListConstruct %1074, %1087, %1088, %1089 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_619 = torch.constant.bool false %1093 = torch.aten.index_put %1086, %1092, %1091, %false_619 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_620 = torch.constant.int 2662400 %1094 = torch.prim.ListConstruct %731, %int2662400_620 : (!torch.int, !torch.int) -> !torch.list %1095 = torch.aten.view %1093, %1094 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int52_621 = torch.constant.int 52 %1096 = torch.aten.mul.Scalar %arg3, %int52_621 : !torch.vtensor<[4,?],si64>, !torch.int -> !torch.vtensor<[4,?],si64> %int2_622 = torch.constant.int 2 %int1_623 = torch.constant.int 1 %1097 = torch.aten.add.Scalar %1096, %int2_622, %int1_623 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_624 = torch.constant.int 4 %1098 = torch.aten.mul.int %int4_624, %655 : !torch.int, !torch.int -> !torch.int %1099 = torch.prim.ListConstruct %1098 : (!torch.int) -> !torch.list %1100 = torch.aten.view %1097, %1099 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int-1_625 = torch.constant.int -1 %int26_626 = torch.constant.int 26 %int2_627 = torch.constant.int 2 %int16_628 = torch.constant.int 16 %int32_629 = torch.constant.int 32 %int100_630 = torch.constant.int 100 %1101 = torch.prim.ListConstruct %int-1_625, %int26_626, %int2_627, %int16_628, %int32_629, %int100_630 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1102 = torch.aten.view %1095, %1101 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int26_631 = 
torch.constant.int 26 %1103 = torch.aten.mul.int %731, %int26_631 : !torch.int, !torch.int -> !torch.int %int2_632 = torch.constant.int 2 %1104 = torch.aten.mul.int %1103, %int2_632 : !torch.int, !torch.int -> !torch.int %int16_633 = torch.constant.int 16 %int32_634 = torch.constant.int 32 %int100_635 = torch.constant.int 100 %1105 = torch.prim.ListConstruct %1104, %int16_633, %int32_634, %int100_635 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1106 = torch.aten.view %1102, %1105 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,16,32,100],f32> %int0_636 = torch.constant.int 0 %1107 = torch.aten.index_select %1106, %int0_636, %1100 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_637 = torch.constant.int 4 %int16_638 = torch.constant.int 16 %int32_639 = torch.constant.int 32 %int100_640 = torch.constant.int 100 %1108 = torch.prim.ListConstruct %int4_637, %655, %int16_638, %int32_639, %int100_640 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1109 = torch.aten.view %1107, %1108 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_641 = torch.constant.int 1 %1110 = torch.aten.size.int %1109, %int1_641 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_642 = torch.constant.int 16 %1111 = torch.aten.mul.int %1110, %int16_642 : !torch.int, !torch.int -> !torch.int %int4_643 = torch.constant.int 4 %int32_644 = torch.constant.int 32 %int100_645 = torch.constant.int 100 %1112 = torch.prim.ListConstruct %int4_643, %1111, %int32_644, %int100_645 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1113 = torch.aten.view %1109, %1112 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_646 = torch.constant.int 0 %int0_647 = torch.constant.int 0 %int9223372036854775807_648 = torch.constant.int 9223372036854775807 
%int1_649 = torch.constant.int 1 %1114 = torch.aten.slice.Tensor %855, %int0_646, %int0_647, %int9223372036854775807_648, %int1_649 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int16_650 = torch.constant.int 16 %1115 = torch.aten.mul.int %655, %int16_650 : !torch.int, !torch.int -> !torch.int %int1_651 = torch.constant.int 1 %int0_652 = torch.constant.int 0 %int1_653 = torch.constant.int 1 %1116 = torch.aten.slice.Tensor %1114, %int1_651, %int0_652, %1115, %int1_653 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_654 = torch.constant.bool false %1117 = torch.aten.copy %1116, %1113, %false_654 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_655 = torch.constant.int 0 %int0_656 = torch.constant.int 0 %int9223372036854775807_657 = torch.constant.int 9223372036854775807 %int1_658 = torch.constant.int 1 %1118 = torch.aten.slice.Tensor %855, %int0_655, %int0_656, %int9223372036854775807_657, %int1_658 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_659 = torch.constant.int 1 %int0_660 = torch.constant.int 0 %int1_661 = torch.constant.int 1 %1119 = torch.aten.slice_scatter %1118, %1117, %int1_659, %int0_660, %1115, %int1_661 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_662 = torch.constant.int 0 %int0_663 = torch.constant.int 0 %int9223372036854775807_664 = torch.constant.int 9223372036854775807 %int1_665 = torch.constant.int 1 %1120 = torch.aten.slice_scatter %855, %1119, %int0_662, %int0_663, %int9223372036854775807_664, %int1_665 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, 
!torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_666 = torch.constant.int 1 %int1_667 = torch.constant.int 1 %1121 = torch.aten.add.Scalar %1097, %int1_666, %int1_667 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_668 = torch.constant.int 4 %1122 = torch.aten.mul.int %int4_668, %655 : !torch.int, !torch.int -> !torch.int %1123 = torch.prim.ListConstruct %1122 : (!torch.int) -> !torch.list %1124 = torch.aten.view %1121, %1123 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int0_669 = torch.constant.int 0 %1125 = torch.aten.index_select %1106, %int0_669, %1124 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_670 = torch.constant.int 4 %int16_671 = torch.constant.int 16 %int32_672 = torch.constant.int 32 %int100_673 = torch.constant.int 100 %1126 = torch.prim.ListConstruct %int4_670, %655, %int16_671, %int32_672, %int100_673 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1127 = torch.aten.view %1125, %1126 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_674 = torch.constant.int 1 %1128 = torch.aten.size.int %1127, %int1_674 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_675 = torch.constant.int 16 %1129 = torch.aten.mul.int %1128, %int16_675 : !torch.int, !torch.int -> !torch.int %int4_676 = torch.constant.int 4 %int32_677 = torch.constant.int 32 %int100_678 = torch.constant.int 100 %1130 = torch.prim.ListConstruct %int4_676, %1129, %int32_677, %int100_678 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1131 = torch.aten.view %1127, %1130 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_679 = torch.constant.int 0 %int0_680 = torch.constant.int 0 %int9223372036854775807_681 = torch.constant.int 9223372036854775807 %int1_682 = torch.constant.int 1 %1132 = 
torch.aten.slice.Tensor %870, %int0_679, %int0_680, %int9223372036854775807_681, %int1_682 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_683 = torch.constant.int 1 %int0_684 = torch.constant.int 0 %int1_685 = torch.constant.int 1 %1133 = torch.aten.slice.Tensor %1132, %int1_683, %int0_684, %1115, %int1_685 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_686 = torch.constant.bool false %1134 = torch.aten.copy %1133, %1131, %false_686 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_687 = torch.constant.int 0 %int0_688 = torch.constant.int 0 %int9223372036854775807_689 = torch.constant.int 9223372036854775807 %int1_690 = torch.constant.int 1 %1135 = torch.aten.slice.Tensor %870, %int0_687, %int0_688, %int9223372036854775807_689, %int1_690 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_691 = torch.constant.int 1 %int0_692 = torch.constant.int 0 %int1_693 = torch.constant.int 1 %1136 = torch.aten.slice_scatter %1135, %1134, %int1_691, %int0_692, %1115, %int1_693 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_694 = torch.constant.int 0 %int0_695 = torch.constant.int 0 %int9223372036854775807_696 = torch.constant.int 9223372036854775807 %int1_697 = torch.constant.int 1 %1137 = torch.aten.slice_scatter %870, %1136, %int0_694, %int0_695, %int9223372036854775807_696, %int1_697 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_698 = torch.constant.int 0 %int0_699 = torch.constant.int 0 %int9223372036854775807_700 = 
torch.constant.int 9223372036854775807 %int1_701 = torch.constant.int 1 %1138 = torch.aten.slice.Tensor %671, %int0_698, %int0_699, %int9223372036854775807_700, %int1_701 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_702 = torch.constant.int 1 %int0_703 = torch.constant.int 0 %int1_704 = torch.constant.int 1 %1139 = torch.aten.slice.Tensor %1138, %int1_702, %int0_703, %1115, %int1_704 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int0_705 = torch.constant.int 0 %int0_706 = torch.constant.int 0 %int9223372036854775807_707 = torch.constant.int 9223372036854775807 %int1_708 = torch.constant.int 1 %1140 = torch.aten.slice.Tensor %673, %int0_705, %int0_706, %int9223372036854775807_707, %int1_708 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_709 = torch.constant.int 1 %int0_710 = torch.constant.int 0 %int1_711 = torch.constant.int 1 %1141 = torch.aten.slice.Tensor %1140, %int1_709, %int0_710, %1115, %int1_711 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_712 = torch.constant.int 1 %int2_713 = torch.constant.int 2 %1142 = torch.aten.transpose.int %978, %int1_712, %int2_713 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,1,100],f32> %int4_714 = torch.constant.int 4 %int32_715 = torch.constant.int 32 %int1_716 = torch.constant.int 1 %int100_717 = torch.constant.int 100 %1143 = torch.prim.ListConstruct %int4_714, %int32_715, %int1_716, %int100_717 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_718 = torch.constant.bool false %1144 = torch.aten.expand %1142, %1143, %false_718 : !torch.vtensor<[4,32,1,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,100],f32> %int128_719 = 
torch.constant.int 128 %int1_720 = torch.constant.int 1 %int100_721 = torch.constant.int 100 %1145 = torch.prim.ListConstruct %int128_719, %int1_720, %int100_721 : (!torch.int, !torch.int, !torch.int) -> !torch.list %1146 = torch.aten.view %1144, %1145 : !torch.vtensor<[4,32,1,100],f32>, !torch.list -> !torch.vtensor<[128,1,100],f32> %int0_722 = torch.constant.int 0 %int0_723 = torch.constant.int 0 %int9223372036854775807_724 = torch.constant.int 9223372036854775807 %int1_725 = torch.constant.int 1 %1147 = torch.aten.slice.Tensor %1120, %int0_722, %int0_723, %int9223372036854775807_724, %int1_725 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_726 = torch.constant.int 1 %int0_727 = torch.constant.int 0 %int1_728 = torch.constant.int 1 %1148 = torch.aten.slice.Tensor %1147, %int1_726, %int0_727, %1115, %int1_728 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_729 = torch.constant.int 1 %int2_730 = torch.constant.int 2 %1149 = torch.aten.transpose.int %1148, %int1_729, %int2_730 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int2_731 = torch.constant.int 2 %int3_732 = torch.constant.int 3 %1150 = torch.aten.transpose.int %1149, %int2_731, %int3_732 : !torch.vtensor<[4,32,?,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int1_733 = torch.constant.int 1 %1151 = torch.aten.size.int %1139, %int1_733 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_734 = torch.constant.int 4 %int32_735 = torch.constant.int 32 %int100_736 = torch.constant.int 100 %1152 = torch.prim.ListConstruct %int4_734, %int32_735, %int100_736, %1151 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_737 = torch.constant.bool false %1153 = torch.aten.expand %1150, %1152, %false_737 : !torch.vtensor<[4,32,100,?],f32>, !torch.list, 
!torch.bool -> !torch.vtensor<[4,32,100,?],f32> %int0_738 = torch.constant.int 0 %1154 = torch.aten.clone %1153, %int0_738 : !torch.vtensor<[4,32,100,?],f32>, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int128_739 = torch.constant.int 128 %int100_740 = torch.constant.int 100 %1155 = torch.prim.ListConstruct %int128_739, %int100_740, %1151 : (!torch.int, !torch.int, !torch.int) -> !torch.list %1156 = torch.aten._unsafe_view %1154, %1155 : !torch.vtensor<[4,32,100,?],f32>, !torch.list -> !torch.vtensor<[128,100,?],f32> %1157 = torch.aten.bmm %1146, %1156 : !torch.vtensor<[128,1,100],f32>, !torch.vtensor<[128,100,?],f32> -> !torch.vtensor<[128,1,?],f32> %int4_741 = torch.constant.int 4 %int32_742 = torch.constant.int 32 %int1_743 = torch.constant.int 1 %1158 = torch.prim.ListConstruct %int4_741, %int32_742, %int1_743, %1151 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1159 = torch.aten.view %1157, %1158 : !torch.vtensor<[128,1,?],f32>, !torch.list -> !torch.vtensor<[4,32,1,?],f32> %float1.000000e01_744 = torch.constant.float 1.000000e+01 %1160 = torch.aten.div.Scalar %1159, %float1.000000e01_744 : !torch.vtensor<[4,32,1,?],f32>, !torch.float -> !torch.vtensor<[4,32,1,?],f32> %int1_745 = torch.constant.int 1 %1161 = torch.aten.add.Tensor %1160, %895, %int1_745 : !torch.vtensor<[4,32,1,?],f32>, !torch.vtensor<[4,1,1,?],f32>, !torch.int -> !torch.vtensor<[4,32,1,?],f32> %int-1_746 = torch.constant.int -1 %false_747 = torch.constant.bool false %1162 = torch.aten._softmax %1161, %int-1_746, %false_747 : !torch.vtensor<[4,32,1,?],f32>, !torch.int, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int4_748 = torch.constant.int 4 %int32_749 = torch.constant.int 32 %int1_750 = torch.constant.int 1 %1163 = torch.prim.ListConstruct %int4_748, %int32_749, %int1_750, %1151 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_751 = torch.constant.bool false %1164 = torch.aten.expand %1162, %1163, %false_751 : 
!torch.vtensor<[4,32,1,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int128_752 = torch.constant.int 128 %int1_753 = torch.constant.int 1 %1165 = torch.prim.ListConstruct %int128_752, %int1_753, %1151 : (!torch.int, !torch.int, !torch.int) -> !torch.list %1166 = torch.aten.view %1164, %1165 : !torch.vtensor<[4,32,1,?],f32>, !torch.list -> !torch.vtensor<[128,1,?],f32> %int0_754 = torch.constant.int 0 %int0_755 = torch.constant.int 0 %int9223372036854775807_756 = torch.constant.int 9223372036854775807 %int1_757 = torch.constant.int 1 %1167 = torch.aten.slice.Tensor %1137, %int0_754, %int0_755, %int9223372036854775807_756, %int1_757 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_758 = torch.constant.int 1 %int0_759 = torch.constant.int 0 %int1_760 = torch.constant.int 1 %1168 = torch.aten.slice.Tensor %1167, %int1_758, %int0_759, %1115, %int1_760 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_761 = torch.constant.int 1 %int2_762 = torch.constant.int 2 %1169 = torch.aten.transpose.int %1168, %int1_761, %int2_762 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int1_763 = torch.constant.int 1 %1170 = torch.aten.size.int %1141, %int1_763 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_764 = torch.constant.int 4 %int32_765 = torch.constant.int 32 %int100_766 = torch.constant.int 100 %1171 = torch.prim.ListConstruct %int4_764, %int32_765, %1170, %int100_766 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_767 = torch.constant.bool false %1172 = torch.aten.expand %1169, %1171, %false_767 : !torch.vtensor<[4,32,?,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,?,100],f32> %int0_768 = torch.constant.int 0 %1173 = torch.aten.clone %1172, %int0_768 : !torch.vtensor<[4,32,?,100],f32>, 
!torch.int -> !torch.vtensor<[4,32,?,100],f32> %int128_769 = torch.constant.int 128 %int100_770 = torch.constant.int 100 %1174 = torch.prim.ListConstruct %int128_769, %1170, %int100_770 : (!torch.int, !torch.int, !torch.int) -> !torch.list %1175 = torch.aten._unsafe_view %1173, %1174 : !torch.vtensor<[4,32,?,100],f32>, !torch.list -> !torch.vtensor<[128,?,100],f32> %1176 = torch.aten.bmm %1166, %1175 : !torch.vtensor<[128,1,?],f32>, !torch.vtensor<[128,?,100],f32> -> !torch.vtensor<[128,1,100],f32> %int4_771 = torch.constant.int 4 %int32_772 = torch.constant.int 32 %int1_773 = torch.constant.int 1 %int100_774 = torch.constant.int 100 %1177 = torch.prim.ListConstruct %int4_771, %int32_772, %int1_773, %int100_774 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1178 = torch.aten.view %1176, %1177 : !torch.vtensor<[128,1,100],f32>, !torch.list -> !torch.vtensor<[4,32,1,100],f32> %int1_775 = torch.constant.int 1 %int2_776 = torch.constant.int 2 %1179 = torch.aten.transpose.int %1178, %int1_775, %int2_776 : !torch.vtensor<[4,32,1,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,1,32,100],f32> %int4_777 = torch.constant.int 4 %int1_778 = torch.constant.int 1 %int-1_779 = torch.constant.int -1 %1180 = torch.prim.ListConstruct %int4_777, %int1_778, %int-1_779 : (!torch.int, !torch.int, !torch.int) -> !torch.list %1181 = torch.aten.view %1179, %1180 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,3200],f32> %1182 = torch_c.to_builtin_tensor %1181 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_780 = tensor.cast %1182 : tensor<4x1x3200xf32> to tensor %1183 = torch_c.to_builtin_tensor %15 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %1184 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_780, %1183) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_781 = tensor.cast %1184 : tensor to tensor<4x1x3200xf32> %1185 = torch_c.from_builtin_tensor %cast_781 : tensor<4x1x3200xf32> -> 
!torch.vtensor<[4,1,3200],f32> %int1_782 = torch.constant.int 1 %1186 = torch.aten.add.Tensor %943, %1185, %int1_782 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_783 = torch.constant.int 2 %1187 = torch.aten.pow.Tensor_Scalar %1186, %int2_783 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_784 = torch.constant.int -1 %1188 = torch.prim.ListConstruct %int-1_784 : (!torch.int) -> !torch.list %true_785 = torch.constant.bool true %none_786 = torch.constant.none %1189 = torch.aten.mean.dim %1187, %1188, %true_785, %none_786 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_787 = torch.constant.float 9.9999999747524271E-7 %int1_788 = torch.constant.int 1 %1190 = torch.aten.add.Scalar %1189, %float9.999990e-07_787, %int1_788 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %1191 = torch.aten.rsqrt %1190 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %1192 = torch.aten.mul.Tensor %1186, %1191 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %1193 = torch.aten.mul.Tensor %1192, %16 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %1194 = torch_c.to_builtin_tensor %1193 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_789 = tensor.cast %1194 : tensor<4x1x3200xf32> to tensor %1195 = torch_c.to_builtin_tensor %17 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %1196 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_789, %1195) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_790 = tensor.cast %1196 : tensor to tensor<4x1x8640xf32> %1197 = torch_c.from_builtin_tensor %cast_790 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %1198 = torch.aten.silu %1197 : !torch.vtensor<[4,1,8640],f32> -> 
!torch.vtensor<[4,1,8640],f32> %1199 = torch_c.to_builtin_tensor %1193 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_791 = tensor.cast %1199 : tensor<4x1x3200xf32> to tensor %1200 = torch_c.to_builtin_tensor %18 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %1201 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_791, %1200) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_792 = tensor.cast %1201 : tensor to tensor<4x1x8640xf32> %1202 = torch_c.from_builtin_tensor %cast_792 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %1203 = torch.aten.mul.Tensor %1198, %1202 : !torch.vtensor<[4,1,8640],f32>, !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32> %1204 = torch_c.to_builtin_tensor %1203 : !torch.vtensor<[4,1,8640],f32> -> tensor<4x1x8640xf32> %cast_793 = tensor.cast %1204 : tensor<4x1x8640xf32> to tensor %1205 = torch_c.to_builtin_tensor %19 : !torch.vtensor<[3200,8640],f16> -> tensor<3200x8640xf16> %1206 = util.call @sharktank_mmtfp_3d_3200_8640_f32f16f32(%cast_793, %1205) : (tensor, tensor<3200x8640xf16>) -> tensor %cast_794 = tensor.cast %1206 : tensor to tensor<4x1x3200xf32> %1207 = torch_c.from_builtin_tensor %cast_794 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int1_795 = torch.constant.int 1 %1208 = torch.aten.add.Tensor %1186, %1207, %int1_795 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_796 = torch.constant.int 2 %1209 = torch.aten.pow.Tensor_Scalar %1208, %int2_796 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_797 = torch.constant.int -1 %1210 = torch.prim.ListConstruct %int-1_797 : (!torch.int) -> !torch.list %true_798 = torch.constant.bool true %none_799 = torch.constant.none %1211 = torch.aten.mean.dim %1209, %1210, %true_798, %none_799 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_800 = 
torch.constant.float 9.9999999747524271E-7 %int1_801 = torch.constant.int 1 %1212 = torch.aten.add.Scalar %1211, %float9.999990e-07_800, %int1_801 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %1213 = torch.aten.rsqrt %1212 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %1214 = torch.aten.mul.Tensor %1208, %1213 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %1215 = torch.aten.mul.Tensor %1214, %20 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %1216 = torch_c.to_builtin_tensor %1215 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_802 = tensor.cast %1216 : tensor<4x1x3200xf32> to tensor %1217 = torch_c.to_builtin_tensor %21 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %1218 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_802, %1217) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_803 = tensor.cast %1218 : tensor to tensor<4x1x3200xf32> %1219 = torch_c.from_builtin_tensor %cast_803 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %1220 = torch_c.to_builtin_tensor %1215 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_804 = tensor.cast %1220 : tensor<4x1x3200xf32> to tensor %1221 = torch_c.to_builtin_tensor %22 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %1222 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_804, %1221) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_805 = tensor.cast %1222 : tensor to tensor<4x1x3200xf32> %1223 = torch_c.from_builtin_tensor %cast_805 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %1224 = torch_c.to_builtin_tensor %1215 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_806 = tensor.cast %1224 : tensor<4x1x3200xf32> to tensor %1225 = torch_c.to_builtin_tensor %23 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %1226 = util.call 
@sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_806, %1225) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_807 = tensor.cast %1226 : tensor to tensor<4x1x3200xf32> %1227 = torch_c.from_builtin_tensor %cast_807 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int4_808 = torch.constant.int 4 %int1_809 = torch.constant.int 1 %int32_810 = torch.constant.int 32 %int100_811 = torch.constant.int 100 %1228 = torch.prim.ListConstruct %int4_808, %int1_809, %int32_810, %int100_811 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1229 = torch.aten.view %1219, %1228 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_812 = torch.constant.int 4 %int1_813 = torch.constant.int 1 %int32_814 = torch.constant.int 32 %int100_815 = torch.constant.int 100 %1230 = torch.prim.ListConstruct %int4_812, %int1_813, %int32_814, %int100_815 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1231 = torch.aten.view %1223, %1230 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_816 = torch.constant.int 4 %int1_817 = torch.constant.int 1 %int32_818 = torch.constant.int 32 %int100_819 = torch.constant.int 100 %1232 = torch.prim.ListConstruct %int4_816, %int1_817, %int32_818, %int100_819 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1233 = torch.aten.view %1227, %1232 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_820 = torch.constant.int 4 %int1_821 = torch.constant.int 1 %int32_822 = torch.constant.int 32 %int-1_823 = torch.constant.int -1 %int2_824 = torch.constant.int 2 %1234 = torch.prim.ListConstruct %int4_820, %int1_821, %int32_822, %int-1_823, %int2_824 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1235 = torch.aten.view %1229, %1234 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %1236 = torch.aten.view_as_complex %1235 : 
!torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %int4_825 = torch.constant.int 4 %int1_826 = torch.constant.int 1 %int32_827 = torch.constant.int 32 %int-1_828 = torch.constant.int -1 %int2_829 = torch.constant.int 2 %1237 = torch.prim.ListConstruct %int4_825, %int1_826, %int32_827, %int-1_828, %int2_829 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1238 = torch.aten.view %1231, %1237 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %1239 = torch.aten.view_as_complex %1238 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %1240 = torch.aten.mul.Tensor %1236, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %1241 = torch.aten.view_as_real %1240 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_830 = torch.constant.int 4 %int1_831 = torch.constant.int 1 %int32_832 = torch.constant.int 32 %int100_833 = torch.constant.int 100 %1242 = torch.prim.ListConstruct %int4_830, %int1_831, %int32_832, %int100_833 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1243 = torch.aten.view %1241, %1242 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %1244 = torch.aten.mul.Tensor %1239, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %1245 = torch.aten.view_as_real %1244 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_834 = torch.constant.int 4 %int1_835 = torch.constant.int 1 %int32_836 = torch.constant.int 32 %int100_837 = torch.constant.int 100 %1246 = torch.prim.ListConstruct %int4_834, %int1_835, %int32_836, %int100_837 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1247 = torch.aten.view %1245, %1246 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> 
%int1_838 = torch.constant.int 1 %int1_839 = torch.constant.int 1 %1248 = torch.aten.add.Scalar %arg2, %int1_838, %int1_839 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[4],si64> %int0_840 = torch.constant.int 0 %int0_841 = torch.constant.int 0 %1249 = torch.aten.select.int %1248, %int0_840, %int0_841 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_842 = torch.constant.int 0 %int0_843 = torch.constant.int 0 %1250 = torch.aten.select.int %arg3, %int0_842, %int0_843 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_844 = torch.constant.int 0 %int0_845 = torch.constant.int 0 %int9223372036854775807_846 = torch.constant.int 9223372036854775807 %int1_847 = torch.constant.int 1 %1251 = torch.aten.slice.Tensor %1250, %int0_844, %int0_845, %int9223372036854775807_846, %int1_847 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_848 = torch.constant.int 16 %1252 = torch.aten.floor_divide.Scalar %1249, %int16_848 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_849 = torch.constant.int 0 %1253 = torch.aten.index_select %1251, %int0_849, %1252 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_850 = torch.constant.int 16 %1254 = torch.aten.remainder.Scalar %1249, %int16_850 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_851 = torch.constant.none %1255 = torch.aten.clone %270, %none_851 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_852 = torch.constant.none %1256 = torch.aten.clone %271, %none_852 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_853 = torch.constant.int 0 %1257 = torch.aten.unsqueeze %1254, %int0_853 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_854 = torch.constant.int 0 %int0_855 = torch.constant.int 0 %1258 = torch.aten.select.int 
%1247, %int0_854, %int0_855 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_856 = torch.constant.int 0 %int0_857 = torch.constant.int 0 %1259 = torch.aten.select.int %1258, %int0_856, %int0_857 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %int-1_858 = torch.constant.int -1 %int26_859 = torch.constant.int 26 %int2_860 = torch.constant.int 2 %int16_861 = torch.constant.int 16 %int32_862 = torch.constant.int 32 %int100_863 = torch.constant.int 100 %1260 = torch.prim.ListConstruct %int-1_858, %int26_859, %int2_860, %int16_861, %int32_862, %int100_863 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1261 = torch.aten.view %1095, %1260 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %1262 = torch.prim.ListConstruct %1253, %1255, %1256, %1257 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_864 = torch.constant.bool false %1263 = torch.aten.index_put %1261, %1262, %1259, %false_864 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_865 = torch.constant.int 2662400 %1264 = torch.prim.ListConstruct %731, %int2662400_865 : (!torch.int, !torch.int) -> !torch.list %1265 = torch.aten.view %1263, %1264 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_866 = torch.constant.int -1 %int26_867 = torch.constant.int 26 %int2_868 = torch.constant.int 2 %int16_869 = torch.constant.int 16 %int32_870 = torch.constant.int 32 %int100_871 = torch.constant.int 100 %1266 = torch.prim.ListConstruct %int-1_866, %int26_867, %int2_868, %int16_869, %int32_870, %int100_871 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1267 = torch.aten.view %1265, %1266 : 
!torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_872 = torch.constant.none %1268 = torch.aten.clone %272, %none_872 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_873 = torch.constant.none %1269 = torch.aten.clone %273, %none_873 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_874 = torch.constant.int 0 %1270 = torch.aten.unsqueeze %1254, %int0_874 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_875 = torch.constant.int 0 %int0_876 = torch.constant.int 0 %1271 = torch.aten.select.int %1233, %int0_875, %int0_876 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_877 = torch.constant.int 0 %int0_878 = torch.constant.int 0 %1272 = torch.aten.select.int %1271, %int0_877, %int0_878 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %1273 = torch.prim.ListConstruct %1253, %1268, %1269, %1270 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_879 = torch.constant.bool false %1274 = torch.aten.index_put %1267, %1273, %1272, %false_879 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_880 = torch.constant.int 2662400 %1275 = torch.prim.ListConstruct %731, %int2662400_880 : (!torch.int, !torch.int) -> !torch.list %1276 = torch.aten.view %1274, %1275 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_881 = torch.constant.int -1 %int26_882 = torch.constant.int 26 %int2_883 = torch.constant.int 2 %int16_884 = torch.constant.int 16 %int32_885 = torch.constant.int 32 %int100_886 = torch.constant.int 100 %1277 = torch.prim.ListConstruct %int-1_881, %int26_882, %int2_883, %int16_884, %int32_885, %int100_886 : (!torch.int, !torch.int, !torch.int, !torch.int, 
!torch.int, !torch.int) -> !torch.list %1278 = torch.aten.view %1276, %1277 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_887 = torch.constant.int 0 %int1_888 = torch.constant.int 1 %1279 = torch.aten.select.int %1248, %int0_887, %int1_888 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_889 = torch.constant.int 0 %int1_890 = torch.constant.int 1 %1280 = torch.aten.select.int %arg3, %int0_889, %int1_890 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_891 = torch.constant.int 0 %int0_892 = torch.constant.int 0 %int9223372036854775807_893 = torch.constant.int 9223372036854775807 %int1_894 = torch.constant.int 1 %1281 = torch.aten.slice.Tensor %1280, %int0_891, %int0_892, %int9223372036854775807_893, %int1_894 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_895 = torch.constant.int 16 %1282 = torch.aten.floor_divide.Scalar %1279, %int16_895 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_896 = torch.constant.int 0 %1283 = torch.aten.index_select %1281, %int0_896, %1282 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_897 = torch.constant.int 16 %1284 = torch.aten.remainder.Scalar %1279, %int16_897 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_898 = torch.constant.none %1285 = torch.aten.clone %274, %none_898 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_899 = torch.constant.none %1286 = torch.aten.clone %275, %none_899 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_900 = torch.constant.int 0 %1287 = torch.aten.unsqueeze %1284, %int0_900 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_901 = torch.constant.int 0 %int1_902 = torch.constant.int 1 %1288 = torch.aten.select.int %1247, %int0_901, %int1_902 : 
!torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_903 = torch.constant.int 0 %int0_904 = torch.constant.int 0 %1289 = torch.aten.select.int %1288, %int0_903, %int0_904 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %1290 = torch.prim.ListConstruct %1283, %1285, %1286, %1287 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_905 = torch.constant.bool false %1291 = torch.aten.index_put %1278, %1290, %1289, %false_905 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_906 = torch.constant.int 2662400 %1292 = torch.prim.ListConstruct %731, %int2662400_906 : (!torch.int, !torch.int) -> !torch.list %1293 = torch.aten.view %1291, %1292 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_907 = torch.constant.int -1 %int26_908 = torch.constant.int 26 %int2_909 = torch.constant.int 2 %int16_910 = torch.constant.int 16 %int32_911 = torch.constant.int 32 %int100_912 = torch.constant.int 100 %1294 = torch.prim.ListConstruct %int-1_907, %int26_908, %int2_909, %int16_910, %int32_911, %int100_912 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1295 = torch.aten.view %1293, %1294 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_913 = torch.constant.none %1296 = torch.aten.clone %276, %none_913 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_914 = torch.constant.none %1297 = torch.aten.clone %277, %none_914 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_915 = torch.constant.int 0 %1298 = torch.aten.unsqueeze %1284, %int0_915 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_916 = torch.constant.int 0 %int1_917 = 
torch.constant.int 1 %1299 = torch.aten.select.int %1233, %int0_916, %int1_917 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_918 = torch.constant.int 0 %int0_919 = torch.constant.int 0 %1300 = torch.aten.select.int %1299, %int0_918, %int0_919 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %1301 = torch.prim.ListConstruct %1283, %1296, %1297, %1298 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_920 = torch.constant.bool false %1302 = torch.aten.index_put %1295, %1301, %1300, %false_920 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_921 = torch.constant.int 2662400 %1303 = torch.prim.ListConstruct %731, %int2662400_921 : (!torch.int, !torch.int) -> !torch.list %1304 = torch.aten.view %1302, %1303 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_922 = torch.constant.int -1 %int26_923 = torch.constant.int 26 %int2_924 = torch.constant.int 2 %int16_925 = torch.constant.int 16 %int32_926 = torch.constant.int 32 %int100_927 = torch.constant.int 100 %1305 = torch.prim.ListConstruct %int-1_922, %int26_923, %int2_924, %int16_925, %int32_926, %int100_927 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1306 = torch.aten.view %1304, %1305 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_928 = torch.constant.int 0 %int2_929 = torch.constant.int 2 %1307 = torch.aten.select.int %1248, %int0_928, %int2_929 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_930 = torch.constant.int 0 %int2_931 = torch.constant.int 2 %1308 = torch.aten.select.int %arg3, %int0_930, %int2_931 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> 
!torch.vtensor<[?],si64> %int0_932 = torch.constant.int 0 %int0_933 = torch.constant.int 0 %int9223372036854775807_934 = torch.constant.int 9223372036854775807 %int1_935 = torch.constant.int 1 %1309 = torch.aten.slice.Tensor %1308, %int0_932, %int0_933, %int9223372036854775807_934, %int1_935 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_936 = torch.constant.int 16 %1310 = torch.aten.floor_divide.Scalar %1307, %int16_936 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_937 = torch.constant.int 0 %1311 = torch.aten.index_select %1309, %int0_937, %1310 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_938 = torch.constant.int 16 %1312 = torch.aten.remainder.Scalar %1307, %int16_938 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_939 = torch.constant.none %1313 = torch.aten.clone %278, %none_939 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_940 = torch.constant.none %1314 = torch.aten.clone %279, %none_940 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_941 = torch.constant.int 0 %1315 = torch.aten.unsqueeze %1312, %int0_941 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_942 = torch.constant.int 0 %int2_943 = torch.constant.int 2 %1316 = torch.aten.select.int %1247, %int0_942, %int2_943 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_944 = torch.constant.int 0 %int0_945 = torch.constant.int 0 %1317 = torch.aten.select.int %1316, %int0_944, %int0_945 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %1318 = torch.prim.ListConstruct %1311, %1313, %1314, %1315 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_946 = torch.constant.bool false %1319 = torch.aten.index_put 
%1306, %1318, %1317, %false_946 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_947 = torch.constant.int 2662400 %1320 = torch.prim.ListConstruct %731, %int2662400_947 : (!torch.int, !torch.int) -> !torch.list %1321 = torch.aten.view %1319, %1320 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_948 = torch.constant.int -1 %int26_949 = torch.constant.int 26 %int2_950 = torch.constant.int 2 %int16_951 = torch.constant.int 16 %int32_952 = torch.constant.int 32 %int100_953 = torch.constant.int 100 %1322 = torch.prim.ListConstruct %int-1_948, %int26_949, %int2_950, %int16_951, %int32_952, %int100_953 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1323 = torch.aten.view %1321, %1322 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_954 = torch.constant.none %1324 = torch.aten.clone %280, %none_954 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_955 = torch.constant.none %1325 = torch.aten.clone %281, %none_955 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_956 = torch.constant.int 0 %1326 = torch.aten.unsqueeze %1312, %int0_956 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_957 = torch.constant.int 0 %int2_958 = torch.constant.int 2 %1327 = torch.aten.select.int %1233, %int0_957, %int2_958 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_959 = torch.constant.int 0 %int0_960 = torch.constant.int 0 %1328 = torch.aten.select.int %1327, %int0_959, %int0_960 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %1329 = torch.prim.ListConstruct %1311, %1324, %1325, %1326 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> 
!torch.list> %false_961 = torch.constant.bool false %1330 = torch.aten.index_put %1323, %1329, %1328, %false_961 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_962 = torch.constant.int 2662400 %1331 = torch.prim.ListConstruct %731, %int2662400_962 : (!torch.int, !torch.int) -> !torch.list %1332 = torch.aten.view %1330, %1331 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_963 = torch.constant.int -1 %int26_964 = torch.constant.int 26 %int2_965 = torch.constant.int 2 %int16_966 = torch.constant.int 16 %int32_967 = torch.constant.int 32 %int100_968 = torch.constant.int 100 %1333 = torch.prim.ListConstruct %int-1_963, %int26_964, %int2_965, %int16_966, %int32_967, %int100_968 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1334 = torch.aten.view %1332, %1333 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_969 = torch.constant.int 0 %int3_970 = torch.constant.int 3 %1335 = torch.aten.select.int %1248, %int0_969, %int3_970 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_971 = torch.constant.int 0 %int3_972 = torch.constant.int 3 %1336 = torch.aten.select.int %arg3, %int0_971, %int3_972 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_973 = torch.constant.int 0 %int0_974 = torch.constant.int 0 %int9223372036854775807_975 = torch.constant.int 9223372036854775807 %int1_976 = torch.constant.int 1 %1337 = torch.aten.slice.Tensor %1336, %int0_973, %int0_974, %int9223372036854775807_975, %int1_976 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_977 = torch.constant.int 16 %1338 = torch.aten.floor_divide.Scalar %1335, %int16_977 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_978 = 
torch.constant.int 0 %1339 = torch.aten.index_select %1337, %int0_978, %1338 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_979 = torch.constant.int 16 %1340 = torch.aten.remainder.Scalar %1335, %int16_979 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_980 = torch.constant.none %1341 = torch.aten.clone %282, %none_980 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_981 = torch.constant.none %1342 = torch.aten.clone %283, %none_981 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_982 = torch.constant.int 0 %1343 = torch.aten.unsqueeze %1340, %int0_982 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_983 = torch.constant.int 0 %int3_984 = torch.constant.int 3 %1344 = torch.aten.select.int %1247, %int0_983, %int3_984 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_985 = torch.constant.int 0 %int0_986 = torch.constant.int 0 %1345 = torch.aten.select.int %1344, %int0_985, %int0_986 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %1346 = torch.prim.ListConstruct %1339, %1341, %1342, %1343 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_987 = torch.constant.bool false %1347 = torch.aten.index_put %1334, %1346, %1345, %false_987 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_988 = torch.constant.int 2662400 %1348 = torch.prim.ListConstruct %731, %int2662400_988 : (!torch.int, !torch.int) -> !torch.list %1349 = torch.aten.view %1347, %1348 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_989 = torch.constant.int -1 %int26_990 = torch.constant.int 26 %int2_991 = torch.constant.int 2 %int16_992 = 
torch.constant.int 16 %int32_993 = torch.constant.int 32 %int100_994 = torch.constant.int 100 %1350 = torch.prim.ListConstruct %int-1_989, %int26_990, %int2_991, %int16_992, %int32_993, %int100_994 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1351 = torch.aten.view %1349, %1350 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_995 = torch.constant.none %1352 = torch.aten.clone %284, %none_995 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_996 = torch.constant.none %1353 = torch.aten.clone %285, %none_996 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_997 = torch.constant.int 0 %1354 = torch.aten.unsqueeze %1340, %int0_997 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_998 = torch.constant.int 0 %int3_999 = torch.constant.int 3 %1355 = torch.aten.select.int %1233, %int0_998, %int3_999 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_1000 = torch.constant.int 0 %int0_1001 = torch.constant.int 0 %1356 = torch.aten.select.int %1355, %int0_1000, %int0_1001 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %1357 = torch.prim.ListConstruct %1339, %1352, %1353, %1354 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_1002 = torch.constant.bool false %1358 = torch.aten.index_put %1351, %1357, %1356, %false_1002 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_1003 = torch.constant.int 2662400 %1359 = torch.prim.ListConstruct %731, %int2662400_1003 : (!torch.int, !torch.int) -> !torch.list %1360 = torch.aten.view %1358, %1359 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int52_1004 = 
torch.constant.int 52 %1361 = torch.aten.mul.Scalar %arg3, %int52_1004 : !torch.vtensor<[4,?],si64>, !torch.int -> !torch.vtensor<[4,?],si64> %int4_1005 = torch.constant.int 4 %int1_1006 = torch.constant.int 1 %1362 = torch.aten.add.Scalar %1361, %int4_1005, %int1_1006 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_1007 = torch.constant.int 4 %1363 = torch.aten.mul.int %int4_1007, %655 : !torch.int, !torch.int -> !torch.int %1364 = torch.prim.ListConstruct %1363 : (!torch.int) -> !torch.list %1365 = torch.aten.view %1362, %1364 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int-1_1008 = torch.constant.int -1 %int26_1009 = torch.constant.int 26 %int2_1010 = torch.constant.int 2 %int16_1011 = torch.constant.int 16 %int32_1012 = torch.constant.int 32 %int100_1013 = torch.constant.int 100 %1366 = torch.prim.ListConstruct %int-1_1008, %int26_1009, %int2_1010, %int16_1011, %int32_1012, %int100_1013 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1367 = torch.aten.view %1360, %1366 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int26_1014 = torch.constant.int 26 %1368 = torch.aten.mul.int %731, %int26_1014 : !torch.int, !torch.int -> !torch.int %int2_1015 = torch.constant.int 2 %1369 = torch.aten.mul.int %1368, %int2_1015 : !torch.int, !torch.int -> !torch.int %int16_1016 = torch.constant.int 16 %int32_1017 = torch.constant.int 32 %int100_1018 = torch.constant.int 100 %1370 = torch.prim.ListConstruct %1369, %int16_1016, %int32_1017, %int100_1018 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1371 = torch.aten.view %1367, %1370 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,16,32,100],f32> %int0_1019 = torch.constant.int 0 %1372 = torch.aten.index_select %1371, %int0_1019, %1365 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> 
!torch.vtensor<[?,16,32,100],f32> %int4_1020 = torch.constant.int 4 %int16_1021 = torch.constant.int 16 %int32_1022 = torch.constant.int 32 %int100_1023 = torch.constant.int 100 %1373 = torch.prim.ListConstruct %int4_1020, %655, %int16_1021, %int32_1022, %int100_1023 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1374 = torch.aten.view %1372, %1373 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_1024 = torch.constant.int 1 %1375 = torch.aten.size.int %1374, %int1_1024 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_1025 = torch.constant.int 16 %1376 = torch.aten.mul.int %1375, %int16_1025 : !torch.int, !torch.int -> !torch.int %int4_1026 = torch.constant.int 4 %int32_1027 = torch.constant.int 32 %int100_1028 = torch.constant.int 100 %1377 = torch.prim.ListConstruct %int4_1026, %1376, %int32_1027, %int100_1028 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1378 = torch.aten.view %1374, %1377 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_1029 = torch.constant.int 0 %int0_1030 = torch.constant.int 0 %int9223372036854775807_1031 = torch.constant.int 9223372036854775807 %int1_1032 = torch.constant.int 1 %1379 = torch.aten.slice.Tensor %1120, %int0_1029, %int0_1030, %int9223372036854775807_1031, %int1_1032 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int16_1033 = torch.constant.int 16 %1380 = torch.aten.mul.int %655, %int16_1033 : !torch.int, !torch.int -> !torch.int %int1_1034 = torch.constant.int 1 %int0_1035 = torch.constant.int 0 %int1_1036 = torch.constant.int 1 %1381 = torch.aten.slice.Tensor %1379, %int1_1034, %int0_1035, %1380, %int1_1036 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_1037 = torch.constant.bool false %1382 = 
torch.aten.copy %1381, %1378, %false_1037 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_1038 = torch.constant.int 0 %int0_1039 = torch.constant.int 0 %int9223372036854775807_1040 = torch.constant.int 9223372036854775807 %int1_1041 = torch.constant.int 1 %1383 = torch.aten.slice.Tensor %1120, %int0_1038, %int0_1039, %int9223372036854775807_1040, %int1_1041 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_1042 = torch.constant.int 1 %int0_1043 = torch.constant.int 0 %int1_1044 = torch.constant.int 1 %1384 = torch.aten.slice_scatter %1383, %1382, %int1_1042, %int0_1043, %1380, %int1_1044 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_1045 = torch.constant.int 0 %int0_1046 = torch.constant.int 0 %int9223372036854775807_1047 = torch.constant.int 9223372036854775807 %int1_1048 = torch.constant.int 1 %1385 = torch.aten.slice_scatter %1120, %1384, %int0_1045, %int0_1046, %int9223372036854775807_1047, %int1_1048 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_1049 = torch.constant.int 1 %int1_1050 = torch.constant.int 1 %1386 = torch.aten.add.Scalar %1362, %int1_1049, %int1_1050 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_1051 = torch.constant.int 4 %1387 = torch.aten.mul.int %int4_1051, %655 : !torch.int, !torch.int -> !torch.int %1388 = torch.prim.ListConstruct %1387 : (!torch.int) -> !torch.list %1389 = torch.aten.view %1386, %1388 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int0_1052 = torch.constant.int 0 %1390 = torch.aten.index_select %1371, %int0_1052, %1389 : !torch.vtensor<[?,16,32,100],f32>, 
!torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_1053 = torch.constant.int 4 %int16_1054 = torch.constant.int 16 %int32_1055 = torch.constant.int 32 %int100_1056 = torch.constant.int 100 %1391 = torch.prim.ListConstruct %int4_1053, %655, %int16_1054, %int32_1055, %int100_1056 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1392 = torch.aten.view %1390, %1391 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_1057 = torch.constant.int 1 %1393 = torch.aten.size.int %1392, %int1_1057 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_1058 = torch.constant.int 16 %1394 = torch.aten.mul.int %1393, %int16_1058 : !torch.int, !torch.int -> !torch.int %int4_1059 = torch.constant.int 4 %int32_1060 = torch.constant.int 32 %int100_1061 = torch.constant.int 100 %1395 = torch.prim.ListConstruct %int4_1059, %1394, %int32_1060, %int100_1061 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1396 = torch.aten.view %1392, %1395 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_1062 = torch.constant.int 0 %int0_1063 = torch.constant.int 0 %int9223372036854775807_1064 = torch.constant.int 9223372036854775807 %int1_1065 = torch.constant.int 1 %1397 = torch.aten.slice.Tensor %1137, %int0_1062, %int0_1063, %int9223372036854775807_1064, %int1_1065 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_1066 = torch.constant.int 1 %int0_1067 = torch.constant.int 0 %int1_1068 = torch.constant.int 1 %1398 = torch.aten.slice.Tensor %1397, %int1_1066, %int0_1067, %1380, %int1_1068 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_1069 = torch.constant.bool false %1399 = torch.aten.copy %1398, %1396, %false_1069 : !torch.vtensor<[4,?,32,100],f32>, 
!torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_1070 = torch.constant.int 0 %int0_1071 = torch.constant.int 0 %int9223372036854775807_1072 = torch.constant.int 9223372036854775807 %int1_1073 = torch.constant.int 1 %1400 = torch.aten.slice.Tensor %1137, %int0_1070, %int0_1071, %int9223372036854775807_1072, %int1_1073 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_1074 = torch.constant.int 1 %int0_1075 = torch.constant.int 0 %int1_1076 = torch.constant.int 1 %1401 = torch.aten.slice_scatter %1400, %1399, %int1_1074, %int0_1075, %1380, %int1_1076 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_1077 = torch.constant.int 0 %int0_1078 = torch.constant.int 0 %int9223372036854775807_1079 = torch.constant.int 9223372036854775807 %int1_1080 = torch.constant.int 1 %1402 = torch.aten.slice_scatter %1137, %1401, %int0_1077, %int0_1078, %int9223372036854775807_1079, %int1_1080 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_1081 = torch.constant.int 0 %int0_1082 = torch.constant.int 0 %int9223372036854775807_1083 = torch.constant.int 9223372036854775807 %int1_1084 = torch.constant.int 1 %1403 = torch.aten.slice.Tensor %671, %int0_1081, %int0_1082, %int9223372036854775807_1083, %int1_1084 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_1085 = torch.constant.int 1 %int0_1086 = torch.constant.int 0 %int1_1087 = torch.constant.int 1 %1404 = torch.aten.slice.Tensor %1403, %int1_1085, %int0_1086, %1380, %int1_1087 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int0_1088 = 
torch.constant.int 0 %int0_1089 = torch.constant.int 0 %int9223372036854775807_1090 = torch.constant.int 9223372036854775807 %int1_1091 = torch.constant.int 1 %1405 = torch.aten.slice.Tensor %673, %int0_1088, %int0_1089, %int9223372036854775807_1090, %int1_1091 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_1092 = torch.constant.int 1 %int0_1093 = torch.constant.int 0 %int1_1094 = torch.constant.int 1 %1406 = torch.aten.slice.Tensor %1405, %int1_1092, %int0_1093, %1380, %int1_1094 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_1095 = torch.constant.int 1 %int2_1096 = torch.constant.int 2 %1407 = torch.aten.transpose.int %1243, %int1_1095, %int2_1096 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,1,100],f32> %int4_1097 = torch.constant.int 4 %int32_1098 = torch.constant.int 32 %int1_1099 = torch.constant.int 1 %int100_1100 = torch.constant.int 100 %1408 = torch.prim.ListConstruct %int4_1097, %int32_1098, %int1_1099, %int100_1100 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_1101 = torch.constant.bool false %1409 = torch.aten.expand %1407, %1408, %false_1101 : !torch.vtensor<[4,32,1,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,100],f32> %int128_1102 = torch.constant.int 128 %int1_1103 = torch.constant.int 1 %int100_1104 = torch.constant.int 100 %1410 = torch.prim.ListConstruct %int128_1102, %int1_1103, %int100_1104 : (!torch.int, !torch.int, !torch.int) -> !torch.list %1411 = torch.aten.view %1409, %1410 : !torch.vtensor<[4,32,1,100],f32>, !torch.list -> !torch.vtensor<[128,1,100],f32> %int0_1105 = torch.constant.int 0 %int0_1106 = torch.constant.int 0 %int9223372036854775807_1107 = torch.constant.int 9223372036854775807 %int1_1108 = torch.constant.int 1 %1412 = torch.aten.slice.Tensor %1385, %int0_1105, %int0_1106, 
%int9223372036854775807_1107, %int1_1108 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_1109 = torch.constant.int 1 %int0_1110 = torch.constant.int 0 %int1_1111 = torch.constant.int 1 %1413 = torch.aten.slice.Tensor %1412, %int1_1109, %int0_1110, %1380, %int1_1111 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_1112 = torch.constant.int 1 %int2_1113 = torch.constant.int 2 %1414 = torch.aten.transpose.int %1413, %int1_1112, %int2_1113 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int2_1114 = torch.constant.int 2 %int3_1115 = torch.constant.int 3 %1415 = torch.aten.transpose.int %1414, %int2_1114, %int3_1115 : !torch.vtensor<[4,32,?,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int1_1116 = torch.constant.int 1 %1416 = torch.aten.size.int %1404, %int1_1116 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_1117 = torch.constant.int 4 %int32_1118 = torch.constant.int 32 %int100_1119 = torch.constant.int 100 %1417 = torch.prim.ListConstruct %int4_1117, %int32_1118, %int100_1119, %1416 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_1120 = torch.constant.bool false %1418 = torch.aten.expand %1415, %1417, %false_1120 : !torch.vtensor<[4,32,100,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,100,?],f32> %int0_1121 = torch.constant.int 0 %1419 = torch.aten.clone %1418, %int0_1121 : !torch.vtensor<[4,32,100,?],f32>, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int128_1122 = torch.constant.int 128 %int100_1123 = torch.constant.int 100 %1420 = torch.prim.ListConstruct %int128_1122, %int100_1123, %1416 : (!torch.int, !torch.int, !torch.int) -> !torch.list %1421 = torch.aten._unsafe_view %1419, %1420 : !torch.vtensor<[4,32,100,?],f32>, !torch.list -> !torch.vtensor<[128,100,?],f32> %1422 = 
torch.aten.bmm %1411, %1421 : !torch.vtensor<[128,1,100],f32>, !torch.vtensor<[128,100,?],f32> -> !torch.vtensor<[128,1,?],f32> %int4_1124 = torch.constant.int 4 %int32_1125 = torch.constant.int 32 %int1_1126 = torch.constant.int 1 %1423 = torch.prim.ListConstruct %int4_1124, %int32_1125, %int1_1126, %1416 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1424 = torch.aten.view %1422, %1423 : !torch.vtensor<[128,1,?],f32>, !torch.list -> !torch.vtensor<[4,32,1,?],f32> %float1.000000e01_1127 = torch.constant.float 1.000000e+01 %1425 = torch.aten.div.Scalar %1424, %float1.000000e01_1127 : !torch.vtensor<[4,32,1,?],f32>, !torch.float -> !torch.vtensor<[4,32,1,?],f32> %int1_1128 = torch.constant.int 1 %1426 = torch.aten.add.Tensor %1425, %895, %int1_1128 : !torch.vtensor<[4,32,1,?],f32>, !torch.vtensor<[4,1,1,?],f32>, !torch.int -> !torch.vtensor<[4,32,1,?],f32> %int-1_1129 = torch.constant.int -1 %false_1130 = torch.constant.bool false %1427 = torch.aten._softmax %1426, %int-1_1129, %false_1130 : !torch.vtensor<[4,32,1,?],f32>, !torch.int, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int4_1131 = torch.constant.int 4 %int32_1132 = torch.constant.int 32 %int1_1133 = torch.constant.int 1 %1428 = torch.prim.ListConstruct %int4_1131, %int32_1132, %int1_1133, %1416 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_1134 = torch.constant.bool false %1429 = torch.aten.expand %1427, %1428, %false_1134 : !torch.vtensor<[4,32,1,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int128_1135 = torch.constant.int 128 %int1_1136 = torch.constant.int 1 %1430 = torch.prim.ListConstruct %int128_1135, %int1_1136, %1416 : (!torch.int, !torch.int, !torch.int) -> !torch.list %1431 = torch.aten.view %1429, %1430 : !torch.vtensor<[4,32,1,?],f32>, !torch.list -> !torch.vtensor<[128,1,?],f32> %int0_1137 = torch.constant.int 0 %int0_1138 = torch.constant.int 0 %int9223372036854775807_1139 = torch.constant.int 9223372036854775807 
%int1_1140 = torch.constant.int 1 %1432 = torch.aten.slice.Tensor %1402, %int0_1137, %int0_1138, %int9223372036854775807_1139, %int1_1140 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_1141 = torch.constant.int 1 %int0_1142 = torch.constant.int 0 %int1_1143 = torch.constant.int 1 %1433 = torch.aten.slice.Tensor %1432, %int1_1141, %int0_1142, %1380, %int1_1143 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_1144 = torch.constant.int 1 %int2_1145 = torch.constant.int 2 %1434 = torch.aten.transpose.int %1433, %int1_1144, %int2_1145 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int1_1146 = torch.constant.int 1 %1435 = torch.aten.size.int %1406, %int1_1146 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_1147 = torch.constant.int 4 %int32_1148 = torch.constant.int 32 %int100_1149 = torch.constant.int 100 %1436 = torch.prim.ListConstruct %int4_1147, %int32_1148, %1435, %int100_1149 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_1150 = torch.constant.bool false %1437 = torch.aten.expand %1434, %1436, %false_1150 : !torch.vtensor<[4,32,?,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,?,100],f32> %int0_1151 = torch.constant.int 0 %1438 = torch.aten.clone %1437, %int0_1151 : !torch.vtensor<[4,32,?,100],f32>, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int128_1152 = torch.constant.int 128 %int100_1153 = torch.constant.int 100 %1439 = torch.prim.ListConstruct %int128_1152, %1435, %int100_1153 : (!torch.int, !torch.int, !torch.int) -> !torch.list %1440 = torch.aten._unsafe_view %1438, %1439 : !torch.vtensor<[4,32,?,100],f32>, !torch.list -> !torch.vtensor<[128,?,100],f32> %1441 = torch.aten.bmm %1431, %1440 : !torch.vtensor<[128,1,?],f32>, !torch.vtensor<[128,?,100],f32> -> !torch.vtensor<[128,1,100],f32> 
%int4_1154 = torch.constant.int 4 %int32_1155 = torch.constant.int 32 %int1_1156 = torch.constant.int 1 %int100_1157 = torch.constant.int 100 %1442 = torch.prim.ListConstruct %int4_1154, %int32_1155, %int1_1156, %int100_1157 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1443 = torch.aten.view %1441, %1442 : !torch.vtensor<[128,1,100],f32>, !torch.list -> !torch.vtensor<[4,32,1,100],f32> %int1_1158 = torch.constant.int 1 %int2_1159 = torch.constant.int 2 %1444 = torch.aten.transpose.int %1443, %int1_1158, %int2_1159 : !torch.vtensor<[4,32,1,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,1,32,100],f32> %int4_1160 = torch.constant.int 4 %int1_1161 = torch.constant.int 1 %int-1_1162 = torch.constant.int -1 %1445 = torch.prim.ListConstruct %int4_1160, %int1_1161, %int-1_1162 : (!torch.int, !torch.int, !torch.int) -> !torch.list %1446 = torch.aten.view %1444, %1445 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,3200],f32> %1447 = torch_c.to_builtin_tensor %1446 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_1163 = tensor.cast %1447 : tensor<4x1x3200xf32> to tensor %1448 = torch_c.to_builtin_tensor %24 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %1449 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_1163, %1448) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_1164 = tensor.cast %1449 : tensor to tensor<4x1x3200xf32> %1450 = torch_c.from_builtin_tensor %cast_1164 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int1_1165 = torch.constant.int 1 %1451 = torch.aten.add.Tensor %1208, %1450, %int1_1165 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_1166 = torch.constant.int 2 %1452 = torch.aten.pow.Tensor_Scalar %1451, %int2_1166 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_1167 = torch.constant.int -1 %1453 = torch.prim.ListConstruct %int-1_1167 : (!torch.int) -> 
!torch.list %true_1168 = torch.constant.bool true %none_1169 = torch.constant.none %1454 = torch.aten.mean.dim %1452, %1453, %true_1168, %none_1169 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_1170 = torch.constant.float 9.9999999747524271E-7 %int1_1171 = torch.constant.int 1 %1455 = torch.aten.add.Scalar %1454, %float9.999990e-07_1170, %int1_1171 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %1456 = torch.aten.rsqrt %1455 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %1457 = torch.aten.mul.Tensor %1451, %1456 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %1458 = torch.aten.mul.Tensor %1457, %25 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %1459 = torch_c.to_builtin_tensor %1458 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_1172 = tensor.cast %1459 : tensor<4x1x3200xf32> to tensor %1460 = torch_c.to_builtin_tensor %26 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %1461 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_1172, %1460) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_1173 = tensor.cast %1461 : tensor to tensor<4x1x8640xf32> %1462 = torch_c.from_builtin_tensor %cast_1173 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %1463 = torch.aten.silu %1462 : !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32> %1464 = torch_c.to_builtin_tensor %1458 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_1174 = tensor.cast %1464 : tensor<4x1x3200xf32> to tensor %1465 = torch_c.to_builtin_tensor %27 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %1466 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_1174, %1465) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_1175 = tensor.cast %1466 : tensor to tensor<4x1x8640xf32> %1467 = 
torch_c.from_builtin_tensor %cast_1175 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %1468 = torch.aten.mul.Tensor %1463, %1467 : !torch.vtensor<[4,1,8640],f32>, !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32> %1469 = torch_c.to_builtin_tensor %1468 : !torch.vtensor<[4,1,8640],f32> -> tensor<4x1x8640xf32> %cast_1176 = tensor.cast %1469 : tensor<4x1x8640xf32> to tensor %1470 = torch_c.to_builtin_tensor %28 : !torch.vtensor<[3200,8640],f16> -> tensor<3200x8640xf16> %1471 = util.call @sharktank_mmtfp_3d_3200_8640_f32f16f32(%cast_1176, %1470) : (tensor, tensor<3200x8640xf16>) -> tensor %cast_1177 = tensor.cast %1471 : tensor to tensor<4x1x3200xf32> %1472 = torch_c.from_builtin_tensor %cast_1177 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int1_1178 = torch.constant.int 1 %1473 = torch.aten.add.Tensor %1451, %1472, %int1_1178 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_1179 = torch.constant.int 2 %1474 = torch.aten.pow.Tensor_Scalar %1473, %int2_1179 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_1180 = torch.constant.int -1 %1475 = torch.prim.ListConstruct %int-1_1180 : (!torch.int) -> !torch.list %true_1181 = torch.constant.bool true %none_1182 = torch.constant.none %1476 = torch.aten.mean.dim %1474, %1475, %true_1181, %none_1182 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_1183 = torch.constant.float 9.9999999747524271E-7 %int1_1184 = torch.constant.int 1 %1477 = torch.aten.add.Scalar %1476, %float9.999990e-07_1183, %int1_1184 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %1478 = torch.aten.rsqrt %1477 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %1479 = torch.aten.mul.Tensor %1473, %1478 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> 
%1480 = torch.aten.mul.Tensor %1479, %29 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %1481 = torch_c.to_builtin_tensor %1480 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_1185 = tensor.cast %1481 : tensor<4x1x3200xf32> to tensor %1482 = torch_c.to_builtin_tensor %30 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %1483 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_1185, %1482) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_1186 = tensor.cast %1483 : tensor to tensor<4x1x3200xf32> %1484 = torch_c.from_builtin_tensor %cast_1186 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %1485 = torch_c.to_builtin_tensor %1480 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_1187 = tensor.cast %1485 : tensor<4x1x3200xf32> to tensor %1486 = torch_c.to_builtin_tensor %31 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %1487 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_1187, %1486) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_1188 = tensor.cast %1487 : tensor to tensor<4x1x3200xf32> %1488 = torch_c.from_builtin_tensor %cast_1188 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %1489 = torch_c.to_builtin_tensor %1480 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_1189 = tensor.cast %1489 : tensor<4x1x3200xf32> to tensor %1490 = torch_c.to_builtin_tensor %32 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %1491 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_1189, %1490) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_1190 = tensor.cast %1491 : tensor to tensor<4x1x3200xf32> %1492 = torch_c.from_builtin_tensor %cast_1190 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int4_1191 = torch.constant.int 4 %int1_1192 = torch.constant.int 1 %int32_1193 = torch.constant.int 32 %int100_1194 = torch.constant.int 100 %1493 = torch.prim.ListConstruct %int4_1191, %int1_1192, %int32_1193, 
%int100_1194 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1494 = torch.aten.view %1484, %1493 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_1195 = torch.constant.int 4 %int1_1196 = torch.constant.int 1 %int32_1197 = torch.constant.int 32 %int100_1198 = torch.constant.int 100 %1495 = torch.prim.ListConstruct %int4_1195, %int1_1196, %int32_1197, %int100_1198 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1496 = torch.aten.view %1488, %1495 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_1199 = torch.constant.int 4 %int1_1200 = torch.constant.int 1 %int32_1201 = torch.constant.int 32 %int100_1202 = torch.constant.int 100 %1497 = torch.prim.ListConstruct %int4_1199, %int1_1200, %int32_1201, %int100_1202 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1498 = torch.aten.view %1492, %1497 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_1203 = torch.constant.int 4 %int1_1204 = torch.constant.int 1 %int32_1205 = torch.constant.int 32 %int-1_1206 = torch.constant.int -1 %int2_1207 = torch.constant.int 2 %1499 = torch.prim.ListConstruct %int4_1203, %int1_1204, %int32_1205, %int-1_1206, %int2_1207 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1500 = torch.aten.view %1494, %1499 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %1501 = torch.aten.view_as_complex %1500 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %int4_1208 = torch.constant.int 4 %int1_1209 = torch.constant.int 1 %int32_1210 = torch.constant.int 32 %int-1_1211 = torch.constant.int -1 %int2_1212 = torch.constant.int 2 %1502 = torch.prim.ListConstruct %int4_1208, %int1_1209, %int32_1210, %int-1_1211, %int2_1212 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1503 = torch.aten.view %1496, %1502 : 
!torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %1504 = torch.aten.view_as_complex %1503 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %1505 = torch.aten.mul.Tensor %1501, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %1506 = torch.aten.view_as_real %1505 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_1213 = torch.constant.int 4 %int1_1214 = torch.constant.int 1 %int32_1215 = torch.constant.int 32 %int100_1216 = torch.constant.int 100 %1507 = torch.prim.ListConstruct %int4_1213, %int1_1214, %int32_1215, %int100_1216 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1508 = torch.aten.view %1506, %1507 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %1509 = torch.aten.mul.Tensor %1504, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %1510 = torch.aten.view_as_real %1509 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_1217 = torch.constant.int 4 %int1_1218 = torch.constant.int 1 %int32_1219 = torch.constant.int 32 %int100_1220 = torch.constant.int 100 %1511 = torch.prim.ListConstruct %int4_1217, %int1_1218, %int32_1219, %int100_1220 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1512 = torch.aten.view %1510, %1511 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int1_1221 = torch.constant.int 1 %int1_1222 = torch.constant.int 1 %1513 = torch.aten.add.Scalar %arg2, %int1_1221, %int1_1222 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[4],si64> %int0_1223 = torch.constant.int 0 %int0_1224 = torch.constant.int 0 %1514 = torch.aten.select.int %1513, %int0_1223, %int0_1224 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_1225 = 
torch.constant.int 0 %int0_1226 = torch.constant.int 0 %1515 = torch.aten.select.int %arg3, %int0_1225, %int0_1226 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_1227 = torch.constant.int 0 %int0_1228 = torch.constant.int 0 %int9223372036854775807_1229 = torch.constant.int 9223372036854775807 %int1_1230 = torch.constant.int 1 %1516 = torch.aten.slice.Tensor %1515, %int0_1227, %int0_1228, %int9223372036854775807_1229, %int1_1230 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_1231 = torch.constant.int 16 %1517 = torch.aten.floor_divide.Scalar %1514, %int16_1231 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_1232 = torch.constant.int 0 %1518 = torch.aten.index_select %1516, %int0_1232, %1517 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_1233 = torch.constant.int 16 %1519 = torch.aten.remainder.Scalar %1514, %int16_1233 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_1234 = torch.constant.none %1520 = torch.aten.clone %286, %none_1234 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_1235 = torch.constant.none %1521 = torch.aten.clone %287, %none_1235 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_1236 = torch.constant.int 0 %1522 = torch.aten.unsqueeze %1519, %int0_1236 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_1237 = torch.constant.int 0 %int0_1238 = torch.constant.int 0 %1523 = torch.aten.select.int %1512, %int0_1237, %int0_1238 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_1239 = torch.constant.int 0 %int0_1240 = torch.constant.int 0 %1524 = torch.aten.select.int %1523, %int0_1239, %int0_1240 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %int-1_1241 = torch.constant.int -1 %int26_1242 = 
torch.constant.int 26 %int2_1243 = torch.constant.int 2 %int16_1244 = torch.constant.int 16 %int32_1245 = torch.constant.int 32 %int100_1246 = torch.constant.int 100 %1525 = torch.prim.ListConstruct %int-1_1241, %int26_1242, %int2_1243, %int16_1244, %int32_1245, %int100_1246 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1526 = torch.aten.view %1360, %1525 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %1527 = torch.prim.ListConstruct %1518, %1520, %1521, %1522 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_1247 = torch.constant.bool false %1528 = torch.aten.index_put %1526, %1527, %1524, %false_1247 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_1248 = torch.constant.int 2662400 %1529 = torch.prim.ListConstruct %731, %int2662400_1248 : (!torch.int, !torch.int) -> !torch.list %1530 = torch.aten.view %1528, %1529 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_1249 = torch.constant.int -1 %int26_1250 = torch.constant.int 26 %int2_1251 = torch.constant.int 2 %int16_1252 = torch.constant.int 16 %int32_1253 = torch.constant.int 32 %int100_1254 = torch.constant.int 100 %1531 = torch.prim.ListConstruct %int-1_1249, %int26_1250, %int2_1251, %int16_1252, %int32_1253, %int100_1254 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1532 = torch.aten.view %1530, %1531 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_1255 = torch.constant.none %1533 = torch.aten.clone %288, %none_1255 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_1256 = torch.constant.none %1534 = torch.aten.clone %289, %none_1256 : !torch.vtensor<[1],si64>, !torch.none -> 
!torch.vtensor<[1],si64> %int0_1257 = torch.constant.int 0 %1535 = torch.aten.unsqueeze %1519, %int0_1257 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_1258 = torch.constant.int 0 %int0_1259 = torch.constant.int 0 %1536 = torch.aten.select.int %1498, %int0_1258, %int0_1259 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_1260 = torch.constant.int 0 %int0_1261 = torch.constant.int 0 %1537 = torch.aten.select.int %1536, %int0_1260, %int0_1261 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %1538 = torch.prim.ListConstruct %1518, %1533, %1534, %1535 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_1262 = torch.constant.bool false %1539 = torch.aten.index_put %1532, %1538, %1537, %false_1262 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_1263 = torch.constant.int 2662400 %1540 = torch.prim.ListConstruct %731, %int2662400_1263 : (!torch.int, !torch.int) -> !torch.list %1541 = torch.aten.view %1539, %1540 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_1264 = torch.constant.int -1 %int26_1265 = torch.constant.int 26 %int2_1266 = torch.constant.int 2 %int16_1267 = torch.constant.int 16 %int32_1268 = torch.constant.int 32 %int100_1269 = torch.constant.int 100 %1542 = torch.prim.ListConstruct %int-1_1264, %int26_1265, %int2_1266, %int16_1267, %int32_1268, %int100_1269 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1543 = torch.aten.view %1541, %1542 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_1270 = torch.constant.int 0 %int1_1271 = torch.constant.int 1 %1544 = torch.aten.select.int %1513, %int0_1270, %int1_1271 : 
!torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_1272 = torch.constant.int 0 %int1_1273 = torch.constant.int 1 %1545 = torch.aten.select.int %arg3, %int0_1272, %int1_1273 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_1274 = torch.constant.int 0 %int0_1275 = torch.constant.int 0 %int9223372036854775807_1276 = torch.constant.int 9223372036854775807 %int1_1277 = torch.constant.int 1 %1546 = torch.aten.slice.Tensor %1545, %int0_1274, %int0_1275, %int9223372036854775807_1276, %int1_1277 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_1278 = torch.constant.int 16 %1547 = torch.aten.floor_divide.Scalar %1544, %int16_1278 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_1279 = torch.constant.int 0 %1548 = torch.aten.index_select %1546, %int0_1279, %1547 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_1280 = torch.constant.int 16 %1549 = torch.aten.remainder.Scalar %1544, %int16_1280 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_1281 = torch.constant.none %1550 = torch.aten.clone %290, %none_1281 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_1282 = torch.constant.none %1551 = torch.aten.clone %291, %none_1282 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_1283 = torch.constant.int 0 %1552 = torch.aten.unsqueeze %1549, %int0_1283 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_1284 = torch.constant.int 0 %int1_1285 = torch.constant.int 1 %1553 = torch.aten.select.int %1512, %int0_1284, %int1_1285 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_1286 = torch.constant.int 0 %int0_1287 = torch.constant.int 0 %1554 = torch.aten.select.int %1553, %int0_1286, %int0_1287 : !torch.vtensor<[1,32,100],f32>, !torch.int, 
!torch.int -> !torch.vtensor<[32,100],f32> %1555 = torch.prim.ListConstruct %1548, %1550, %1551, %1552 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_1288 = torch.constant.bool false %1556 = torch.aten.index_put %1543, %1555, %1554, %false_1288 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_1289 = torch.constant.int 2662400 %1557 = torch.prim.ListConstruct %731, %int2662400_1289 : (!torch.int, !torch.int) -> !torch.list %1558 = torch.aten.view %1556, %1557 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_1290 = torch.constant.int -1 %int26_1291 = torch.constant.int 26 %int2_1292 = torch.constant.int 2 %int16_1293 = torch.constant.int 16 %int32_1294 = torch.constant.int 32 %int100_1295 = torch.constant.int 100 %1559 = torch.prim.ListConstruct %int-1_1290, %int26_1291, %int2_1292, %int16_1293, %int32_1294, %int100_1295 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1560 = torch.aten.view %1558, %1559 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_1296 = torch.constant.none %1561 = torch.aten.clone %292, %none_1296 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_1297 = torch.constant.none %1562 = torch.aten.clone %293, %none_1297 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_1298 = torch.constant.int 0 %1563 = torch.aten.unsqueeze %1549, %int0_1298 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_1299 = torch.constant.int 0 %int1_1300 = torch.constant.int 1 %1564 = torch.aten.select.int %1498, %int0_1299, %int1_1300 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_1301 = torch.constant.int 0 %int0_1302 = torch.constant.int 
0 %1565 = torch.aten.select.int %1564, %int0_1301, %int0_1302 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %1566 = torch.prim.ListConstruct %1548, %1561, %1562, %1563 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_1303 = torch.constant.bool false %1567 = torch.aten.index_put %1560, %1566, %1565, %false_1303 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_1304 = torch.constant.int 2662400 %1568 = torch.prim.ListConstruct %731, %int2662400_1304 : (!torch.int, !torch.int) -> !torch.list %1569 = torch.aten.view %1567, %1568 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_1305 = torch.constant.int -1 %int26_1306 = torch.constant.int 26 %int2_1307 = torch.constant.int 2 %int16_1308 = torch.constant.int 16 %int32_1309 = torch.constant.int 32 %int100_1310 = torch.constant.int 100 %1570 = torch.prim.ListConstruct %int-1_1305, %int26_1306, %int2_1307, %int16_1308, %int32_1309, %int100_1310 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1571 = torch.aten.view %1569, %1570 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_1311 = torch.constant.int 0 %int2_1312 = torch.constant.int 2 %1572 = torch.aten.select.int %1513, %int0_1311, %int2_1312 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_1313 = torch.constant.int 0 %int2_1314 = torch.constant.int 2 %1573 = torch.aten.select.int %arg3, %int0_1313, %int2_1314 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_1315 = torch.constant.int 0 %int0_1316 = torch.constant.int 0 %int9223372036854775807_1317 = torch.constant.int 9223372036854775807 %int1_1318 = torch.constant.int 1 %1574 = 
torch.aten.slice.Tensor %1573, %int0_1315, %int0_1316, %int9223372036854775807_1317, %int1_1318 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_1319 = torch.constant.int 16 %1575 = torch.aten.floor_divide.Scalar %1572, %int16_1319 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_1320 = torch.constant.int 0 %1576 = torch.aten.index_select %1574, %int0_1320, %1575 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_1321 = torch.constant.int 16 %1577 = torch.aten.remainder.Scalar %1572, %int16_1321 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_1322 = torch.constant.none %1578 = torch.aten.clone %294, %none_1322 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_1323 = torch.constant.none %1579 = torch.aten.clone %295, %none_1323 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_1324 = torch.constant.int 0 %1580 = torch.aten.unsqueeze %1577, %int0_1324 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_1325 = torch.constant.int 0 %int2_1326 = torch.constant.int 2 %1581 = torch.aten.select.int %1512, %int0_1325, %int2_1326 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_1327 = torch.constant.int 0 %int0_1328 = torch.constant.int 0 %1582 = torch.aten.select.int %1581, %int0_1327, %int0_1328 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %1583 = torch.prim.ListConstruct %1576, %1578, %1579, %1580 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_1329 = torch.constant.bool false %1584 = torch.aten.index_put %1571, %1583, %1582, %false_1329 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> 
%int2662400_1330 = torch.constant.int 2662400 %1585 = torch.prim.ListConstruct %731, %int2662400_1330 : (!torch.int, !torch.int) -> !torch.list %1586 = torch.aten.view %1584, %1585 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_1331 = torch.constant.int -1 %int26_1332 = torch.constant.int 26 %int2_1333 = torch.constant.int 2 %int16_1334 = torch.constant.int 16 %int32_1335 = torch.constant.int 32 %int100_1336 = torch.constant.int 100 %1587 = torch.prim.ListConstruct %int-1_1331, %int26_1332, %int2_1333, %int16_1334, %int32_1335, %int100_1336 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1588 = torch.aten.view %1586, %1587 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_1337 = torch.constant.none %1589 = torch.aten.clone %296, %none_1337 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_1338 = torch.constant.none %1590 = torch.aten.clone %297, %none_1338 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_1339 = torch.constant.int 0 %1591 = torch.aten.unsqueeze %1577, %int0_1339 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_1340 = torch.constant.int 0 %int2_1341 = torch.constant.int 2 %1592 = torch.aten.select.int %1498, %int0_1340, %int2_1341 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_1342 = torch.constant.int 0 %int0_1343 = torch.constant.int 0 %1593 = torch.aten.select.int %1592, %int0_1342, %int0_1343 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %1594 = torch.prim.ListConstruct %1576, %1589, %1590, %1591 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_1344 = torch.constant.bool false %1595 = torch.aten.index_put %1588, %1594, %1593, %false_1344 : 
!torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_1345 = torch.constant.int 2662400 %1596 = torch.prim.ListConstruct %731, %int2662400_1345 : (!torch.int, !torch.int) -> !torch.list %1597 = torch.aten.view %1595, %1596 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_1346 = torch.constant.int -1 %int26_1347 = torch.constant.int 26 %int2_1348 = torch.constant.int 2 %int16_1349 = torch.constant.int 16 %int32_1350 = torch.constant.int 32 %int100_1351 = torch.constant.int 100 %1598 = torch.prim.ListConstruct %int-1_1346, %int26_1347, %int2_1348, %int16_1349, %int32_1350, %int100_1351 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1599 = torch.aten.view %1597, %1598 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_1352 = torch.constant.int 0 %int3_1353 = torch.constant.int 3 %1600 = torch.aten.select.int %1513, %int0_1352, %int3_1353 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_1354 = torch.constant.int 0 %int3_1355 = torch.constant.int 3 %1601 = torch.aten.select.int %arg3, %int0_1354, %int3_1355 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_1356 = torch.constant.int 0 %int0_1357 = torch.constant.int 0 %int9223372036854775807_1358 = torch.constant.int 9223372036854775807 %int1_1359 = torch.constant.int 1 %1602 = torch.aten.slice.Tensor %1601, %int0_1356, %int0_1357, %int9223372036854775807_1358, %int1_1359 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_1360 = torch.constant.int 16 %1603 = torch.aten.floor_divide.Scalar %1600, %int16_1360 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_1361 = torch.constant.int 0 %1604 = torch.aten.index_select %1602, %int0_1361, %1603 : 
!torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_1362 = torch.constant.int 16 %1605 = torch.aten.remainder.Scalar %1600, %int16_1362 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_1363 = torch.constant.none %1606 = torch.aten.clone %298, %none_1363 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_1364 = torch.constant.none %1607 = torch.aten.clone %299, %none_1364 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_1365 = torch.constant.int 0 %1608 = torch.aten.unsqueeze %1605, %int0_1365 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_1366 = torch.constant.int 0 %int3_1367 = torch.constant.int 3 %1609 = torch.aten.select.int %1512, %int0_1366, %int3_1367 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_1368 = torch.constant.int 0 %int0_1369 = torch.constant.int 0 %1610 = torch.aten.select.int %1609, %int0_1368, %int0_1369 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %1611 = torch.prim.ListConstruct %1604, %1606, %1607, %1608 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_1370 = torch.constant.bool false %1612 = torch.aten.index_put %1599, %1611, %1610, %false_1370 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_1371 = torch.constant.int 2662400 %1613 = torch.prim.ListConstruct %731, %int2662400_1371 : (!torch.int, !torch.int) -> !torch.list %1614 = torch.aten.view %1612, %1613 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_1372 = torch.constant.int -1 %int26_1373 = torch.constant.int 26 %int2_1374 = torch.constant.int 2 %int16_1375 = torch.constant.int 16 %int32_1376 = torch.constant.int 32 
%int100_1377 = torch.constant.int 100 %1615 = torch.prim.ListConstruct %int-1_1372, %int26_1373, %int2_1374, %int16_1375, %int32_1376, %int100_1377 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1616 = torch.aten.view %1614, %1615 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_1378 = torch.constant.none %1617 = torch.aten.clone %300, %none_1378 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_1379 = torch.constant.none %1618 = torch.aten.clone %301, %none_1379 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_1380 = torch.constant.int 0 %1619 = torch.aten.unsqueeze %1605, %int0_1380 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_1381 = torch.constant.int 0 %int3_1382 = torch.constant.int 3 %1620 = torch.aten.select.int %1498, %int0_1381, %int3_1382 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_1383 = torch.constant.int 0 %int0_1384 = torch.constant.int 0 %1621 = torch.aten.select.int %1620, %int0_1383, %int0_1384 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %1622 = torch.prim.ListConstruct %1604, %1617, %1618, %1619 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_1385 = torch.constant.bool false %1623 = torch.aten.index_put %1616, %1622, %1621, %false_1385 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_1386 = torch.constant.int 2662400 %1624 = torch.prim.ListConstruct %731, %int2662400_1386 : (!torch.int, !torch.int) -> !torch.list %1625 = torch.aten.view %1623, %1624 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int52_1387 = torch.constant.int 52 %1626 = torch.aten.mul.Scalar 
%arg3, %int52_1387 : !torch.vtensor<[4,?],si64>, !torch.int -> !torch.vtensor<[4,?],si64> %int6_1388 = torch.constant.int 6 %int1_1389 = torch.constant.int 1 %1627 = torch.aten.add.Scalar %1626, %int6_1388, %int1_1389 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_1390 = torch.constant.int 4 %1628 = torch.aten.mul.int %int4_1390, %655 : !torch.int, !torch.int -> !torch.int %1629 = torch.prim.ListConstruct %1628 : (!torch.int) -> !torch.list %1630 = torch.aten.view %1627, %1629 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int-1_1391 = torch.constant.int -1 %int26_1392 = torch.constant.int 26 %int2_1393 = torch.constant.int 2 %int16_1394 = torch.constant.int 16 %int32_1395 = torch.constant.int 32 %int100_1396 = torch.constant.int 100 %1631 = torch.prim.ListConstruct %int-1_1391, %int26_1392, %int2_1393, %int16_1394, %int32_1395, %int100_1396 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1632 = torch.aten.view %1625, %1631 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int26_1397 = torch.constant.int 26 %1633 = torch.aten.mul.int %731, %int26_1397 : !torch.int, !torch.int -> !torch.int %int2_1398 = torch.constant.int 2 %1634 = torch.aten.mul.int %1633, %int2_1398 : !torch.int, !torch.int -> !torch.int %int16_1399 = torch.constant.int 16 %int32_1400 = torch.constant.int 32 %int100_1401 = torch.constant.int 100 %1635 = torch.prim.ListConstruct %1634, %int16_1399, %int32_1400, %int100_1401 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1636 = torch.aten.view %1632, %1635 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,16,32,100],f32> %int0_1402 = torch.constant.int 0 %1637 = torch.aten.index_select %1636, %int0_1402, %1630 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_1403 = torch.constant.int 4 
%int16_1404 = torch.constant.int 16 %int32_1405 = torch.constant.int 32 %int100_1406 = torch.constant.int 100 %1638 = torch.prim.ListConstruct %int4_1403, %655, %int16_1404, %int32_1405, %int100_1406 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1639 = torch.aten.view %1637, %1638 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_1407 = torch.constant.int 1 %1640 = torch.aten.size.int %1639, %int1_1407 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_1408 = torch.constant.int 16 %1641 = torch.aten.mul.int %1640, %int16_1408 : !torch.int, !torch.int -> !torch.int %int4_1409 = torch.constant.int 4 %int32_1410 = torch.constant.int 32 %int100_1411 = torch.constant.int 100 %1642 = torch.prim.ListConstruct %int4_1409, %1641, %int32_1410, %int100_1411 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1643 = torch.aten.view %1639, %1642 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_1412 = torch.constant.int 0 %int0_1413 = torch.constant.int 0 %int9223372036854775807_1414 = torch.constant.int 9223372036854775807 %int1_1415 = torch.constant.int 1 %1644 = torch.aten.slice.Tensor %1385, %int0_1412, %int0_1413, %int9223372036854775807_1414, %int1_1415 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int16_1416 = torch.constant.int 16 %1645 = torch.aten.mul.int %655, %int16_1416 : !torch.int, !torch.int -> !torch.int %int1_1417 = torch.constant.int 1 %int0_1418 = torch.constant.int 0 %int1_1419 = torch.constant.int 1 %1646 = torch.aten.slice.Tensor %1644, %int1_1417, %int0_1418, %1645, %int1_1419 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_1420 = torch.constant.bool false %1647 = torch.aten.copy %1646, %1643, %false_1420 : !torch.vtensor<[4,?,32,100],f32>, 
!torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_1421 = torch.constant.int 0 %int0_1422 = torch.constant.int 0 %int9223372036854775807_1423 = torch.constant.int 9223372036854775807 %int1_1424 = torch.constant.int 1 %1648 = torch.aten.slice.Tensor %1385, %int0_1421, %int0_1422, %int9223372036854775807_1423, %int1_1424 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_1425 = torch.constant.int 1 %int0_1426 = torch.constant.int 0 %int1_1427 = torch.constant.int 1 %1649 = torch.aten.slice_scatter %1648, %1647, %int1_1425, %int0_1426, %1645, %int1_1427 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_1428 = torch.constant.int 0 %int0_1429 = torch.constant.int 0 %int9223372036854775807_1430 = torch.constant.int 9223372036854775807 %int1_1431 = torch.constant.int 1 %1650 = torch.aten.slice_scatter %1385, %1649, %int0_1428, %int0_1429, %int9223372036854775807_1430, %int1_1431 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_1432 = torch.constant.int 1 %int1_1433 = torch.constant.int 1 %1651 = torch.aten.add.Scalar %1627, %int1_1432, %int1_1433 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_1434 = torch.constant.int 4 %1652 = torch.aten.mul.int %int4_1434, %655 : !torch.int, !torch.int -> !torch.int %1653 = torch.prim.ListConstruct %1652 : (!torch.int) -> !torch.list %1654 = torch.aten.view %1651, %1653 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int0_1435 = torch.constant.int 0 %1655 = torch.aten.index_select %1636, %int0_1435, %1654 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_1436 = 
torch.constant.int 4 %int16_1437 = torch.constant.int 16 %int32_1438 = torch.constant.int 32 %int100_1439 = torch.constant.int 100 %1656 = torch.prim.ListConstruct %int4_1436, %655, %int16_1437, %int32_1438, %int100_1439 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1657 = torch.aten.view %1655, %1656 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_1440 = torch.constant.int 1 %1658 = torch.aten.size.int %1657, %int1_1440 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_1441 = torch.constant.int 16 %1659 = torch.aten.mul.int %1658, %int16_1441 : !torch.int, !torch.int -> !torch.int %int4_1442 = torch.constant.int 4 %int32_1443 = torch.constant.int 32 %int100_1444 = torch.constant.int 100 %1660 = torch.prim.ListConstruct %int4_1442, %1659, %int32_1443, %int100_1444 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1661 = torch.aten.view %1657, %1660 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_1445 = torch.constant.int 0 %int0_1446 = torch.constant.int 0 %int9223372036854775807_1447 = torch.constant.int 9223372036854775807 %int1_1448 = torch.constant.int 1 %1662 = torch.aten.slice.Tensor %1402, %int0_1445, %int0_1446, %int9223372036854775807_1447, %int1_1448 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_1449 = torch.constant.int 1 %int0_1450 = torch.constant.int 0 %int1_1451 = torch.constant.int 1 %1663 = torch.aten.slice.Tensor %1662, %int1_1449, %int0_1450, %1645, %int1_1451 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_1452 = torch.constant.bool false %1664 = torch.aten.copy %1663, %1661, %false_1452 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_1453 = 
torch.constant.int 0 %int0_1454 = torch.constant.int 0 %int9223372036854775807_1455 = torch.constant.int 9223372036854775807 %int1_1456 = torch.constant.int 1 %1665 = torch.aten.slice.Tensor %1402, %int0_1453, %int0_1454, %int9223372036854775807_1455, %int1_1456 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_1457 = torch.constant.int 1 %int0_1458 = torch.constant.int 0 %int1_1459 = torch.constant.int 1 %1666 = torch.aten.slice_scatter %1665, %1664, %int1_1457, %int0_1458, %1645, %int1_1459 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_1460 = torch.constant.int 0 %int0_1461 = torch.constant.int 0 %int9223372036854775807_1462 = torch.constant.int 9223372036854775807 %int1_1463 = torch.constant.int 1 %1667 = torch.aten.slice_scatter %1402, %1666, %int0_1460, %int0_1461, %int9223372036854775807_1462, %int1_1463 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_1464 = torch.constant.int 0 %int0_1465 = torch.constant.int 0 %int9223372036854775807_1466 = torch.constant.int 9223372036854775807 %int1_1467 = torch.constant.int 1 %1668 = torch.aten.slice.Tensor %671, %int0_1464, %int0_1465, %int9223372036854775807_1466, %int1_1467 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_1468 = torch.constant.int 1 %int0_1469 = torch.constant.int 0 %int1_1470 = torch.constant.int 1 %1669 = torch.aten.slice.Tensor %1668, %int1_1468, %int0_1469, %1645, %int1_1470 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int0_1471 = torch.constant.int 0 %int0_1472 = torch.constant.int 0 %int9223372036854775807_1473 = 
torch.constant.int 9223372036854775807 %int1_1474 = torch.constant.int 1 %1670 = torch.aten.slice.Tensor %673, %int0_1471, %int0_1472, %int9223372036854775807_1473, %int1_1474 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_1475 = torch.constant.int 1 %int0_1476 = torch.constant.int 0 %int1_1477 = torch.constant.int 1 %1671 = torch.aten.slice.Tensor %1670, %int1_1475, %int0_1476, %1645, %int1_1477 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_1478 = torch.constant.int 1 %int2_1479 = torch.constant.int 2 %1672 = torch.aten.transpose.int %1508, %int1_1478, %int2_1479 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,1,100],f32> %int4_1480 = torch.constant.int 4 %int32_1481 = torch.constant.int 32 %int1_1482 = torch.constant.int 1 %int100_1483 = torch.constant.int 100 %1673 = torch.prim.ListConstruct %int4_1480, %int32_1481, %int1_1482, %int100_1483 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_1484 = torch.constant.bool false %1674 = torch.aten.expand %1672, %1673, %false_1484 : !torch.vtensor<[4,32,1,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,100],f32> %int128_1485 = torch.constant.int 128 %int1_1486 = torch.constant.int 1 %int100_1487 = torch.constant.int 100 %1675 = torch.prim.ListConstruct %int128_1485, %int1_1486, %int100_1487 : (!torch.int, !torch.int, !torch.int) -> !torch.list %1676 = torch.aten.view %1674, %1675 : !torch.vtensor<[4,32,1,100],f32>, !torch.list -> !torch.vtensor<[128,1,100],f32> %int0_1488 = torch.constant.int 0 %int0_1489 = torch.constant.int 0 %int9223372036854775807_1490 = torch.constant.int 9223372036854775807 %int1_1491 = torch.constant.int 1 %1677 = torch.aten.slice.Tensor %1650, %int0_1488, %int0_1489, %int9223372036854775807_1490, %int1_1491 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, 
!torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_1492 = torch.constant.int 1 %int0_1493 = torch.constant.int 0 %int1_1494 = torch.constant.int 1 %1678 = torch.aten.slice.Tensor %1677, %int1_1492, %int0_1493, %1645, %int1_1494 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_1495 = torch.constant.int 1 %int2_1496 = torch.constant.int 2 %1679 = torch.aten.transpose.int %1678, %int1_1495, %int2_1496 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int2_1497 = torch.constant.int 2 %int3_1498 = torch.constant.int 3 %1680 = torch.aten.transpose.int %1679, %int2_1497, %int3_1498 : !torch.vtensor<[4,32,?,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int1_1499 = torch.constant.int 1 %1681 = torch.aten.size.int %1669, %int1_1499 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_1500 = torch.constant.int 4 %int32_1501 = torch.constant.int 32 %int100_1502 = torch.constant.int 100 %1682 = torch.prim.ListConstruct %int4_1500, %int32_1501, %int100_1502, %1681 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_1503 = torch.constant.bool false %1683 = torch.aten.expand %1680, %1682, %false_1503 : !torch.vtensor<[4,32,100,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,100,?],f32> %int0_1504 = torch.constant.int 0 %1684 = torch.aten.clone %1683, %int0_1504 : !torch.vtensor<[4,32,100,?],f32>, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int128_1505 = torch.constant.int 128 %int100_1506 = torch.constant.int 100 %1685 = torch.prim.ListConstruct %int128_1505, %int100_1506, %1681 : (!torch.int, !torch.int, !torch.int) -> !torch.list %1686 = torch.aten._unsafe_view %1684, %1685 : !torch.vtensor<[4,32,100,?],f32>, !torch.list -> !torch.vtensor<[128,100,?],f32> %1687 = torch.aten.bmm %1676, %1686 : !torch.vtensor<[128,1,100],f32>, 
!torch.vtensor<[128,100,?],f32> -> !torch.vtensor<[128,1,?],f32> %int4_1507 = torch.constant.int 4 %int32_1508 = torch.constant.int 32 %int1_1509 = torch.constant.int 1 %1688 = torch.prim.ListConstruct %int4_1507, %int32_1508, %int1_1509, %1681 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1689 = torch.aten.view %1687, %1688 : !torch.vtensor<[128,1,?],f32>, !torch.list -> !torch.vtensor<[4,32,1,?],f32> %float1.000000e01_1510 = torch.constant.float 1.000000e+01 %1690 = torch.aten.div.Scalar %1689, %float1.000000e01_1510 : !torch.vtensor<[4,32,1,?],f32>, !torch.float -> !torch.vtensor<[4,32,1,?],f32> %int1_1511 = torch.constant.int 1 %1691 = torch.aten.add.Tensor %1690, %895, %int1_1511 : !torch.vtensor<[4,32,1,?],f32>, !torch.vtensor<[4,1,1,?],f32>, !torch.int -> !torch.vtensor<[4,32,1,?],f32> %int-1_1512 = torch.constant.int -1 %false_1513 = torch.constant.bool false %1692 = torch.aten._softmax %1691, %int-1_1512, %false_1513 : !torch.vtensor<[4,32,1,?],f32>, !torch.int, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int4_1514 = torch.constant.int 4 %int32_1515 = torch.constant.int 32 %int1_1516 = torch.constant.int 1 %1693 = torch.prim.ListConstruct %int4_1514, %int32_1515, %int1_1516, %1681 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_1517 = torch.constant.bool false %1694 = torch.aten.expand %1692, %1693, %false_1517 : !torch.vtensor<[4,32,1,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int128_1518 = torch.constant.int 128 %int1_1519 = torch.constant.int 1 %1695 = torch.prim.ListConstruct %int128_1518, %int1_1519, %1681 : (!torch.int, !torch.int, !torch.int) -> !torch.list %1696 = torch.aten.view %1694, %1695 : !torch.vtensor<[4,32,1,?],f32>, !torch.list -> !torch.vtensor<[128,1,?],f32> %int0_1520 = torch.constant.int 0 %int0_1521 = torch.constant.int 0 %int9223372036854775807_1522 = torch.constant.int 9223372036854775807 %int1_1523 = torch.constant.int 1 %1697 = torch.aten.slice.Tensor 
%1667, %int0_1520, %int0_1521, %int9223372036854775807_1522, %int1_1523 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_1524 = torch.constant.int 1 %int0_1525 = torch.constant.int 0 %int1_1526 = torch.constant.int 1 %1698 = torch.aten.slice.Tensor %1697, %int1_1524, %int0_1525, %1645, %int1_1526 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_1527 = torch.constant.int 1 %int2_1528 = torch.constant.int 2 %1699 = torch.aten.transpose.int %1698, %int1_1527, %int2_1528 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int1_1529 = torch.constant.int 1 %1700 = torch.aten.size.int %1671, %int1_1529 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_1530 = torch.constant.int 4 %int32_1531 = torch.constant.int 32 %int100_1532 = torch.constant.int 100 %1701 = torch.prim.ListConstruct %int4_1530, %int32_1531, %1700, %int100_1532 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_1533 = torch.constant.bool false %1702 = torch.aten.expand %1699, %1701, %false_1533 : !torch.vtensor<[4,32,?,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,?,100],f32> %int0_1534 = torch.constant.int 0 %1703 = torch.aten.clone %1702, %int0_1534 : !torch.vtensor<[4,32,?,100],f32>, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int128_1535 = torch.constant.int 128 %int100_1536 = torch.constant.int 100 %1704 = torch.prim.ListConstruct %int128_1535, %1700, %int100_1536 : (!torch.int, !torch.int, !torch.int) -> !torch.list %1705 = torch.aten._unsafe_view %1703, %1704 : !torch.vtensor<[4,32,?,100],f32>, !torch.list -> !torch.vtensor<[128,?,100],f32> %1706 = torch.aten.bmm %1696, %1705 : !torch.vtensor<[128,1,?],f32>, !torch.vtensor<[128,?,100],f32> -> !torch.vtensor<[128,1,100],f32> %int4_1537 = torch.constant.int 4 %int32_1538 = torch.constant.int 
32 %int1_1539 = torch.constant.int 1 %int100_1540 = torch.constant.int 100 %1707 = torch.prim.ListConstruct %int4_1537, %int32_1538, %int1_1539, %int100_1540 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1708 = torch.aten.view %1706, %1707 : !torch.vtensor<[128,1,100],f32>, !torch.list -> !torch.vtensor<[4,32,1,100],f32> %int1_1541 = torch.constant.int 1 %int2_1542 = torch.constant.int 2 %1709 = torch.aten.transpose.int %1708, %int1_1541, %int2_1542 : !torch.vtensor<[4,32,1,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,1,32,100],f32> %int4_1543 = torch.constant.int 4 %int1_1544 = torch.constant.int 1 %int-1_1545 = torch.constant.int -1 %1710 = torch.prim.ListConstruct %int4_1543, %int1_1544, %int-1_1545 : (!torch.int, !torch.int, !torch.int) -> !torch.list %1711 = torch.aten.view %1709, %1710 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,3200],f32> %1712 = torch_c.to_builtin_tensor %1711 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_1546 = tensor.cast %1712 : tensor<4x1x3200xf32> to tensor %1713 = torch_c.to_builtin_tensor %33 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %1714 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_1546, %1713) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_1547 = tensor.cast %1714 : tensor to tensor<4x1x3200xf32> %1715 = torch_c.from_builtin_tensor %cast_1547 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int1_1548 = torch.constant.int 1 %1716 = torch.aten.add.Tensor %1473, %1715, %int1_1548 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_1549 = torch.constant.int 2 %1717 = torch.aten.pow.Tensor_Scalar %1716, %int2_1549 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_1550 = torch.constant.int -1 %1718 = torch.prim.ListConstruct %int-1_1550 : (!torch.int) -> !torch.list %true_1551 = torch.constant.bool true %none_1552 = 
torch.constant.none %1719 = torch.aten.mean.dim %1717, %1718, %true_1551, %none_1552 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_1553 = torch.constant.float 9.9999999747524271E-7 %int1_1554 = torch.constant.int 1 %1720 = torch.aten.add.Scalar %1719, %float9.999990e-07_1553, %int1_1554 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %1721 = torch.aten.rsqrt %1720 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %1722 = torch.aten.mul.Tensor %1716, %1721 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %1723 = torch.aten.mul.Tensor %1722, %34 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %1724 = torch_c.to_builtin_tensor %1723 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_1555 = tensor.cast %1724 : tensor<4x1x3200xf32> to tensor %1725 = torch_c.to_builtin_tensor %35 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %1726 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_1555, %1725) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_1556 = tensor.cast %1726 : tensor to tensor<4x1x8640xf32> %1727 = torch_c.from_builtin_tensor %cast_1556 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %1728 = torch.aten.silu %1727 : !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32> %1729 = torch_c.to_builtin_tensor %1723 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_1557 = tensor.cast %1729 : tensor<4x1x3200xf32> to tensor %1730 = torch_c.to_builtin_tensor %36 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %1731 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_1557, %1730) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_1558 = tensor.cast %1731 : tensor to tensor<4x1x8640xf32> %1732 = torch_c.from_builtin_tensor %cast_1558 : tensor<4x1x8640xf32> -> 
!torch.vtensor<[4,1,8640],f32> %1733 = torch.aten.mul.Tensor %1728, %1732 : !torch.vtensor<[4,1,8640],f32>, !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32> %1734 = torch_c.to_builtin_tensor %1733 : !torch.vtensor<[4,1,8640],f32> -> tensor<4x1x8640xf32> %cast_1559 = tensor.cast %1734 : tensor<4x1x8640xf32> to tensor %1735 = torch_c.to_builtin_tensor %37 : !torch.vtensor<[3200,8640],f16> -> tensor<3200x8640xf16> %1736 = util.call @sharktank_mmtfp_3d_3200_8640_f32f16f32(%cast_1559, %1735) : (tensor, tensor<3200x8640xf16>) -> tensor %cast_1560 = tensor.cast %1736 : tensor to tensor<4x1x3200xf32> %1737 = torch_c.from_builtin_tensor %cast_1560 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int1_1561 = torch.constant.int 1 %1738 = torch.aten.add.Tensor %1716, %1737, %int1_1561 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_1562 = torch.constant.int 2 %1739 = torch.aten.pow.Tensor_Scalar %1738, %int2_1562 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_1563 = torch.constant.int -1 %1740 = torch.prim.ListConstruct %int-1_1563 : (!torch.int) -> !torch.list %true_1564 = torch.constant.bool true %none_1565 = torch.constant.none %1741 = torch.aten.mean.dim %1739, %1740, %true_1564, %none_1565 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_1566 = torch.constant.float 9.9999999747524271E-7 %int1_1567 = torch.constant.int 1 %1742 = torch.aten.add.Scalar %1741, %float9.999990e-07_1566, %int1_1567 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %1743 = torch.aten.rsqrt %1742 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %1744 = torch.aten.mul.Tensor %1738, %1743 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %1745 = torch.aten.mul.Tensor %1744, %38 : 
!torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %1746 = torch_c.to_builtin_tensor %1745 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_1568 = tensor.cast %1746 : tensor<4x1x3200xf32> to tensor %1747 = torch_c.to_builtin_tensor %39 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %1748 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_1568, %1747) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_1569 = tensor.cast %1748 : tensor to tensor<4x1x3200xf32> %1749 = torch_c.from_builtin_tensor %cast_1569 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %1750 = torch_c.to_builtin_tensor %1745 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_1570 = tensor.cast %1750 : tensor<4x1x3200xf32> to tensor %1751 = torch_c.to_builtin_tensor %40 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %1752 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_1570, %1751) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_1571 = tensor.cast %1752 : tensor to tensor<4x1x3200xf32> %1753 = torch_c.from_builtin_tensor %cast_1571 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %1754 = torch_c.to_builtin_tensor %1745 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_1572 = tensor.cast %1754 : tensor<4x1x3200xf32> to tensor %1755 = torch_c.to_builtin_tensor %41 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %1756 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_1572, %1755) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_1573 = tensor.cast %1756 : tensor to tensor<4x1x3200xf32> %1757 = torch_c.from_builtin_tensor %cast_1573 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int4_1574 = torch.constant.int 4 %int1_1575 = torch.constant.int 1 %int32_1576 = torch.constant.int 32 %int100_1577 = torch.constant.int 100 %1758 = torch.prim.ListConstruct %int4_1574, %int1_1575, %int32_1576, %int100_1577 : (!torch.int, !torch.int, !torch.int, 
!torch.int) -> !torch.list %1759 = torch.aten.view %1749, %1758 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_1578 = torch.constant.int 4 %int1_1579 = torch.constant.int 1 %int32_1580 = torch.constant.int 32 %int100_1581 = torch.constant.int 100 %1760 = torch.prim.ListConstruct %int4_1578, %int1_1579, %int32_1580, %int100_1581 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1761 = torch.aten.view %1753, %1760 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_1582 = torch.constant.int 4 %int1_1583 = torch.constant.int 1 %int32_1584 = torch.constant.int 32 %int100_1585 = torch.constant.int 100 %1762 = torch.prim.ListConstruct %int4_1582, %int1_1583, %int32_1584, %int100_1585 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1763 = torch.aten.view %1757, %1762 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_1586 = torch.constant.int 4 %int1_1587 = torch.constant.int 1 %int32_1588 = torch.constant.int 32 %int-1_1589 = torch.constant.int -1 %int2_1590 = torch.constant.int 2 %1764 = torch.prim.ListConstruct %int4_1586, %int1_1587, %int32_1588, %int-1_1589, %int2_1590 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1765 = torch.aten.view %1759, %1764 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %1766 = torch.aten.view_as_complex %1765 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %int4_1591 = torch.constant.int 4 %int1_1592 = torch.constant.int 1 %int32_1593 = torch.constant.int 32 %int-1_1594 = torch.constant.int -1 %int2_1595 = torch.constant.int 2 %1767 = torch.prim.ListConstruct %int4_1591, %int1_1592, %int32_1593, %int-1_1594, %int2_1595 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1768 = torch.aten.view %1761, %1767 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> 
!torch.vtensor<[4,1,32,50,2],f32> %1769 = torch.aten.view_as_complex %1768 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %1770 = torch.aten.mul.Tensor %1766, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %1771 = torch.aten.view_as_real %1770 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_1596 = torch.constant.int 4 %int1_1597 = torch.constant.int 1 %int32_1598 = torch.constant.int 32 %int100_1599 = torch.constant.int 100 %1772 = torch.prim.ListConstruct %int4_1596, %int1_1597, %int32_1598, %int100_1599 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1773 = torch.aten.view %1771, %1772 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %1774 = torch.aten.mul.Tensor %1769, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %1775 = torch.aten.view_as_real %1774 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_1600 = torch.constant.int 4 %int1_1601 = torch.constant.int 1 %int32_1602 = torch.constant.int 32 %int100_1603 = torch.constant.int 100 %1776 = torch.prim.ListConstruct %int4_1600, %int1_1601, %int32_1602, %int100_1603 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1777 = torch.aten.view %1775, %1776 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int1_1604 = torch.constant.int 1 %int1_1605 = torch.constant.int 1 %1778 = torch.aten.add.Scalar %arg2, %int1_1604, %int1_1605 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[4],si64> %int0_1606 = torch.constant.int 0 %int0_1607 = torch.constant.int 0 %1779 = torch.aten.select.int %1778, %int0_1606, %int0_1607 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_1608 = torch.constant.int 0 %int0_1609 = torch.constant.int 0 %1780 
= torch.aten.select.int %arg3, %int0_1608, %int0_1609 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_1610 = torch.constant.int 0 %int0_1611 = torch.constant.int 0 %int9223372036854775807_1612 = torch.constant.int 9223372036854775807 %int1_1613 = torch.constant.int 1 %1781 = torch.aten.slice.Tensor %1780, %int0_1610, %int0_1611, %int9223372036854775807_1612, %int1_1613 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_1614 = torch.constant.int 16 %1782 = torch.aten.floor_divide.Scalar %1779, %int16_1614 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_1615 = torch.constant.int 0 %1783 = torch.aten.index_select %1781, %int0_1615, %1782 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_1616 = torch.constant.int 16 %1784 = torch.aten.remainder.Scalar %1779, %int16_1616 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_1617 = torch.constant.none %1785 = torch.aten.clone %302, %none_1617 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_1618 = torch.constant.none %1786 = torch.aten.clone %303, %none_1618 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_1619 = torch.constant.int 0 %1787 = torch.aten.unsqueeze %1784, %int0_1619 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_1620 = torch.constant.int 0 %int0_1621 = torch.constant.int 0 %1788 = torch.aten.select.int %1777, %int0_1620, %int0_1621 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_1622 = torch.constant.int 0 %int0_1623 = torch.constant.int 0 %1789 = torch.aten.select.int %1788, %int0_1622, %int0_1623 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %int-1_1624 = torch.constant.int -1 %int26_1625 = torch.constant.int 26 %int2_1626 = torch.constant.int 2 
%int16_1627 = torch.constant.int 16 %int32_1628 = torch.constant.int 32 %int100_1629 = torch.constant.int 100 %1790 = torch.prim.ListConstruct %int-1_1624, %int26_1625, %int2_1626, %int16_1627, %int32_1628, %int100_1629 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1791 = torch.aten.view %1625, %1790 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %1792 = torch.prim.ListConstruct %1783, %1785, %1786, %1787 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_1630 = torch.constant.bool false %1793 = torch.aten.index_put %1791, %1792, %1789, %false_1630 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_1631 = torch.constant.int 2662400 %1794 = torch.prim.ListConstruct %731, %int2662400_1631 : (!torch.int, !torch.int) -> !torch.list %1795 = torch.aten.view %1793, %1794 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_1632 = torch.constant.int -1 %int26_1633 = torch.constant.int 26 %int2_1634 = torch.constant.int 2 %int16_1635 = torch.constant.int 16 %int32_1636 = torch.constant.int 32 %int100_1637 = torch.constant.int 100 %1796 = torch.prim.ListConstruct %int-1_1632, %int26_1633, %int2_1634, %int16_1635, %int32_1636, %int100_1637 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1797 = torch.aten.view %1795, %1796 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_1638 = torch.constant.none %1798 = torch.aten.clone %304, %none_1638 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_1639 = torch.constant.none %1799 = torch.aten.clone %305, %none_1639 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_1640 = torch.constant.int 0 %1800 
= torch.aten.unsqueeze %1784, %int0_1640 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_1641 = torch.constant.int 0 %int0_1642 = torch.constant.int 0 %1801 = torch.aten.select.int %1763, %int0_1641, %int0_1642 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_1643 = torch.constant.int 0 %int0_1644 = torch.constant.int 0 %1802 = torch.aten.select.int %1801, %int0_1643, %int0_1644 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %1803 = torch.prim.ListConstruct %1783, %1798, %1799, %1800 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_1645 = torch.constant.bool false %1804 = torch.aten.index_put %1797, %1803, %1802, %false_1645 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_1646 = torch.constant.int 2662400 %1805 = torch.prim.ListConstruct %731, %int2662400_1646 : (!torch.int, !torch.int) -> !torch.list %1806 = torch.aten.view %1804, %1805 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_1647 = torch.constant.int -1 %int26_1648 = torch.constant.int 26 %int2_1649 = torch.constant.int 2 %int16_1650 = torch.constant.int 16 %int32_1651 = torch.constant.int 32 %int100_1652 = torch.constant.int 100 %1807 = torch.prim.ListConstruct %int-1_1647, %int26_1648, %int2_1649, %int16_1650, %int32_1651, %int100_1652 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1808 = torch.aten.view %1806, %1807 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_1653 = torch.constant.int 0 %int1_1654 = torch.constant.int 1 %1809 = torch.aten.select.int %1778, %int0_1653, %int1_1654 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_1655 
= torch.constant.int 0 %int1_1656 = torch.constant.int 1 %1810 = torch.aten.select.int %arg3, %int0_1655, %int1_1656 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_1657 = torch.constant.int 0 %int0_1658 = torch.constant.int 0 %int9223372036854775807_1659 = torch.constant.int 9223372036854775807 %int1_1660 = torch.constant.int 1 %1811 = torch.aten.slice.Tensor %1810, %int0_1657, %int0_1658, %int9223372036854775807_1659, %int1_1660 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_1661 = torch.constant.int 16 %1812 = torch.aten.floor_divide.Scalar %1809, %int16_1661 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_1662 = torch.constant.int 0 %1813 = torch.aten.index_select %1811, %int0_1662, %1812 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_1663 = torch.constant.int 16 %1814 = torch.aten.remainder.Scalar %1809, %int16_1663 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_1664 = torch.constant.none %1815 = torch.aten.clone %306, %none_1664 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_1665 = torch.constant.none %1816 = torch.aten.clone %307, %none_1665 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_1666 = torch.constant.int 0 %1817 = torch.aten.unsqueeze %1814, %int0_1666 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_1667 = torch.constant.int 0 %int1_1668 = torch.constant.int 1 %1818 = torch.aten.select.int %1777, %int0_1667, %int1_1668 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_1669 = torch.constant.int 0 %int0_1670 = torch.constant.int 0 %1819 = torch.aten.select.int %1818, %int0_1669, %int0_1670 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %1820 = torch.prim.ListConstruct %1813, %1815, %1816, 
%1817 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_1671 = torch.constant.bool false %1821 = torch.aten.index_put %1808, %1820, %1819, %false_1671 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_1672 = torch.constant.int 2662400 %1822 = torch.prim.ListConstruct %731, %int2662400_1672 : (!torch.int, !torch.int) -> !torch.list %1823 = torch.aten.view %1821, %1822 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_1673 = torch.constant.int -1 %int26_1674 = torch.constant.int 26 %int2_1675 = torch.constant.int 2 %int16_1676 = torch.constant.int 16 %int32_1677 = torch.constant.int 32 %int100_1678 = torch.constant.int 100 %1824 = torch.prim.ListConstruct %int-1_1673, %int26_1674, %int2_1675, %int16_1676, %int32_1677, %int100_1678 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1825 = torch.aten.view %1823, %1824 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_1679 = torch.constant.none %1826 = torch.aten.clone %308, %none_1679 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_1680 = torch.constant.none %1827 = torch.aten.clone %309, %none_1680 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_1681 = torch.constant.int 0 %1828 = torch.aten.unsqueeze %1814, %int0_1681 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_1682 = torch.constant.int 0 %int1_1683 = torch.constant.int 1 %1829 = torch.aten.select.int %1763, %int0_1682, %int1_1683 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_1684 = torch.constant.int 0 %int0_1685 = torch.constant.int 0 %1830 = torch.aten.select.int %1829, %int0_1684, %int0_1685 : !torch.vtensor<[1,32,100],f32>, 
!torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %1831 = torch.prim.ListConstruct %1813, %1826, %1827, %1828 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_1686 = torch.constant.bool false %1832 = torch.aten.index_put %1825, %1831, %1830, %false_1686 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_1687 = torch.constant.int 2662400 %1833 = torch.prim.ListConstruct %731, %int2662400_1687 : (!torch.int, !torch.int) -> !torch.list %1834 = torch.aten.view %1832, %1833 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_1688 = torch.constant.int -1 %int26_1689 = torch.constant.int 26 %int2_1690 = torch.constant.int 2 %int16_1691 = torch.constant.int 16 %int32_1692 = torch.constant.int 32 %int100_1693 = torch.constant.int 100 %1835 = torch.prim.ListConstruct %int-1_1688, %int26_1689, %int2_1690, %int16_1691, %int32_1692, %int100_1693 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1836 = torch.aten.view %1834, %1835 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_1694 = torch.constant.int 0 %int2_1695 = torch.constant.int 2 %1837 = torch.aten.select.int %1778, %int0_1694, %int2_1695 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_1696 = torch.constant.int 0 %int2_1697 = torch.constant.int 2 %1838 = torch.aten.select.int %arg3, %int0_1696, %int2_1697 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_1698 = torch.constant.int 0 %int0_1699 = torch.constant.int 0 %int9223372036854775807_1700 = torch.constant.int 9223372036854775807 %int1_1701 = torch.constant.int 1 %1839 = torch.aten.slice.Tensor %1838, %int0_1698, %int0_1699, %int9223372036854775807_1700, %int1_1701 : 
!torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_1702 = torch.constant.int 16 %1840 = torch.aten.floor_divide.Scalar %1837, %int16_1702 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_1703 = torch.constant.int 0 %1841 = torch.aten.index_select %1839, %int0_1703, %1840 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_1704 = torch.constant.int 16 %1842 = torch.aten.remainder.Scalar %1837, %int16_1704 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_1705 = torch.constant.none %1843 = torch.aten.clone %310, %none_1705 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_1706 = torch.constant.none %1844 = torch.aten.clone %311, %none_1706 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_1707 = torch.constant.int 0 %1845 = torch.aten.unsqueeze %1842, %int0_1707 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_1708 = torch.constant.int 0 %int2_1709 = torch.constant.int 2 %1846 = torch.aten.select.int %1777, %int0_1708, %int2_1709 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_1710 = torch.constant.int 0 %int0_1711 = torch.constant.int 0 %1847 = torch.aten.select.int %1846, %int0_1710, %int0_1711 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %1848 = torch.prim.ListConstruct %1841, %1843, %1844, %1845 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_1712 = torch.constant.bool false %1849 = torch.aten.index_put %1836, %1848, %1847, %false_1712 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_1713 = torch.constant.int 2662400 %1850 = torch.prim.ListConstruct %731, %int2662400_1713 : 
(!torch.int, !torch.int) -> !torch.list %1851 = torch.aten.view %1849, %1850 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_1714 = torch.constant.int -1 %int26_1715 = torch.constant.int 26 %int2_1716 = torch.constant.int 2 %int16_1717 = torch.constant.int 16 %int32_1718 = torch.constant.int 32 %int100_1719 = torch.constant.int 100 %1852 = torch.prim.ListConstruct %int-1_1714, %int26_1715, %int2_1716, %int16_1717, %int32_1718, %int100_1719 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1853 = torch.aten.view %1851, %1852 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_1720 = torch.constant.none %1854 = torch.aten.clone %312, %none_1720 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_1721 = torch.constant.none %1855 = torch.aten.clone %313, %none_1721 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_1722 = torch.constant.int 0 %1856 = torch.aten.unsqueeze %1842, %int0_1722 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_1723 = torch.constant.int 0 %int2_1724 = torch.constant.int 2 %1857 = torch.aten.select.int %1763, %int0_1723, %int2_1724 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_1725 = torch.constant.int 0 %int0_1726 = torch.constant.int 0 %1858 = torch.aten.select.int %1857, %int0_1725, %int0_1726 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %1859 = torch.prim.ListConstruct %1841, %1854, %1855, %1856 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_1727 = torch.constant.bool false %1860 = torch.aten.index_put %1853, %1859, %1858, %false_1727 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> 
!torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_1728 = torch.constant.int 2662400 %1861 = torch.prim.ListConstruct %731, %int2662400_1728 : (!torch.int, !torch.int) -> !torch.list %1862 = torch.aten.view %1860, %1861 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_1729 = torch.constant.int -1 %int26_1730 = torch.constant.int 26 %int2_1731 = torch.constant.int 2 %int16_1732 = torch.constant.int 16 %int32_1733 = torch.constant.int 32 %int100_1734 = torch.constant.int 100 %1863 = torch.prim.ListConstruct %int-1_1729, %int26_1730, %int2_1731, %int16_1732, %int32_1733, %int100_1734 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1864 = torch.aten.view %1862, %1863 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_1735 = torch.constant.int 0 %int3_1736 = torch.constant.int 3 %1865 = torch.aten.select.int %1778, %int0_1735, %int3_1736 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_1737 = torch.constant.int 0 %int3_1738 = torch.constant.int 3 %1866 = torch.aten.select.int %arg3, %int0_1737, %int3_1738 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_1739 = torch.constant.int 0 %int0_1740 = torch.constant.int 0 %int9223372036854775807_1741 = torch.constant.int 9223372036854775807 %int1_1742 = torch.constant.int 1 %1867 = torch.aten.slice.Tensor %1866, %int0_1739, %int0_1740, %int9223372036854775807_1741, %int1_1742 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_1743 = torch.constant.int 16 %1868 = torch.aten.floor_divide.Scalar %1865, %int16_1743 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_1744 = torch.constant.int 0 %1869 = torch.aten.index_select %1867, %int0_1744, %1868 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_1745 
= torch.constant.int 16 %1870 = torch.aten.remainder.Scalar %1865, %int16_1745 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_1746 = torch.constant.none %1871 = torch.aten.clone %314, %none_1746 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_1747 = torch.constant.none %1872 = torch.aten.clone %315, %none_1747 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_1748 = torch.constant.int 0 %1873 = torch.aten.unsqueeze %1870, %int0_1748 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_1749 = torch.constant.int 0 %int3_1750 = torch.constant.int 3 %1874 = torch.aten.select.int %1777, %int0_1749, %int3_1750 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_1751 = torch.constant.int 0 %int0_1752 = torch.constant.int 0 %1875 = torch.aten.select.int %1874, %int0_1751, %int0_1752 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %1876 = torch.prim.ListConstruct %1869, %1871, %1872, %1873 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_1753 = torch.constant.bool false %1877 = torch.aten.index_put %1864, %1876, %1875, %false_1753 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_1754 = torch.constant.int 2662400 %1878 = torch.prim.ListConstruct %731, %int2662400_1754 : (!torch.int, !torch.int) -> !torch.list %1879 = torch.aten.view %1877, %1878 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_1755 = torch.constant.int -1 %int26_1756 = torch.constant.int 26 %int2_1757 = torch.constant.int 2 %int16_1758 = torch.constant.int 16 %int32_1759 = torch.constant.int 32 %int100_1760 = torch.constant.int 100 %1880 = torch.prim.ListConstruct %int-1_1755, %int26_1756, %int2_1757, 
%int16_1758, %int32_1759, %int100_1760 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1881 = torch.aten.view %1879, %1880 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_1761 = torch.constant.none %1882 = torch.aten.clone %316, %none_1761 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_1762 = torch.constant.none %1883 = torch.aten.clone %317, %none_1762 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_1763 = torch.constant.int 0 %1884 = torch.aten.unsqueeze %1870, %int0_1763 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_1764 = torch.constant.int 0 %int3_1765 = torch.constant.int 3 %1885 = torch.aten.select.int %1763, %int0_1764, %int3_1765 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_1766 = torch.constant.int 0 %int0_1767 = torch.constant.int 0 %1886 = torch.aten.select.int %1885, %int0_1766, %int0_1767 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %1887 = torch.prim.ListConstruct %1869, %1882, %1883, %1884 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_1768 = torch.constant.bool false %1888 = torch.aten.index_put %1881, %1887, %1886, %false_1768 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_1769 = torch.constant.int 2662400 %1889 = torch.prim.ListConstruct %731, %int2662400_1769 : (!torch.int, !torch.int) -> !torch.list %1890 = torch.aten.view %1888, %1889 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int52_1770 = torch.constant.int 52 %1891 = torch.aten.mul.Scalar %arg3, %int52_1770 : !torch.vtensor<[4,?],si64>, !torch.int -> !torch.vtensor<[4,?],si64> %int8 = 
torch.constant.int 8 %int1_1771 = torch.constant.int 1 %1892 = torch.aten.add.Scalar %1891, %int8, %int1_1771 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_1772 = torch.constant.int 4 %1893 = torch.aten.mul.int %int4_1772, %655 : !torch.int, !torch.int -> !torch.int %1894 = torch.prim.ListConstruct %1893 : (!torch.int) -> !torch.list %1895 = torch.aten.view %1892, %1894 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int-1_1773 = torch.constant.int -1 %int26_1774 = torch.constant.int 26 %int2_1775 = torch.constant.int 2 %int16_1776 = torch.constant.int 16 %int32_1777 = torch.constant.int 32 %int100_1778 = torch.constant.int 100 %1896 = torch.prim.ListConstruct %int-1_1773, %int26_1774, %int2_1775, %int16_1776, %int32_1777, %int100_1778 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1897 = torch.aten.view %1890, %1896 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int26_1779 = torch.constant.int 26 %1898 = torch.aten.mul.int %731, %int26_1779 : !torch.int, !torch.int -> !torch.int %int2_1780 = torch.constant.int 2 %1899 = torch.aten.mul.int %1898, %int2_1780 : !torch.int, !torch.int -> !torch.int %int16_1781 = torch.constant.int 16 %int32_1782 = torch.constant.int 32 %int100_1783 = torch.constant.int 100 %1900 = torch.prim.ListConstruct %1899, %int16_1781, %int32_1782, %int100_1783 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1901 = torch.aten.view %1897, %1900 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,16,32,100],f32> %int0_1784 = torch.constant.int 0 %1902 = torch.aten.index_select %1901, %int0_1784, %1895 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_1785 = torch.constant.int 4 %int16_1786 = torch.constant.int 16 %int32_1787 = torch.constant.int 32 %int100_1788 = torch.constant.int 100 
%1903 = torch.prim.ListConstruct %int4_1785, %655, %int16_1786, %int32_1787, %int100_1788 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1904 = torch.aten.view %1902, %1903 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_1789 = torch.constant.int 1 %1905 = torch.aten.size.int %1904, %int1_1789 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_1790 = torch.constant.int 16 %1906 = torch.aten.mul.int %1905, %int16_1790 : !torch.int, !torch.int -> !torch.int %int4_1791 = torch.constant.int 4 %int32_1792 = torch.constant.int 32 %int100_1793 = torch.constant.int 100 %1907 = torch.prim.ListConstruct %int4_1791, %1906, %int32_1792, %int100_1793 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1908 = torch.aten.view %1904, %1907 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_1794 = torch.constant.int 0 %int0_1795 = torch.constant.int 0 %int9223372036854775807_1796 = torch.constant.int 9223372036854775807 %int1_1797 = torch.constant.int 1 %1909 = torch.aten.slice.Tensor %1650, %int0_1794, %int0_1795, %int9223372036854775807_1796, %int1_1797 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int16_1798 = torch.constant.int 16 %1910 = torch.aten.mul.int %655, %int16_1798 : !torch.int, !torch.int -> !torch.int %int1_1799 = torch.constant.int 1 %int0_1800 = torch.constant.int 0 %int1_1801 = torch.constant.int 1 %1911 = torch.aten.slice.Tensor %1909, %int1_1799, %int0_1800, %1910, %int1_1801 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_1802 = torch.constant.bool false %1912 = torch.aten.copy %1911, %1908, %false_1802 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_1803 = torch.constant.int 
0 %int0_1804 = torch.constant.int 0 %int9223372036854775807_1805 = torch.constant.int 9223372036854775807 %int1_1806 = torch.constant.int 1 %1913 = torch.aten.slice.Tensor %1650, %int0_1803, %int0_1804, %int9223372036854775807_1805, %int1_1806 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_1807 = torch.constant.int 1 %int0_1808 = torch.constant.int 0 %int1_1809 = torch.constant.int 1 %1914 = torch.aten.slice_scatter %1913, %1912, %int1_1807, %int0_1808, %1910, %int1_1809 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_1810 = torch.constant.int 0 %int0_1811 = torch.constant.int 0 %int9223372036854775807_1812 = torch.constant.int 9223372036854775807 %int1_1813 = torch.constant.int 1 %1915 = torch.aten.slice_scatter %1650, %1914, %int0_1810, %int0_1811, %int9223372036854775807_1812, %int1_1813 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_1814 = torch.constant.int 1 %int1_1815 = torch.constant.int 1 %1916 = torch.aten.add.Scalar %1892, %int1_1814, %int1_1815 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_1816 = torch.constant.int 4 %1917 = torch.aten.mul.int %int4_1816, %655 : !torch.int, !torch.int -> !torch.int %1918 = torch.prim.ListConstruct %1917 : (!torch.int) -> !torch.list %1919 = torch.aten.view %1916, %1918 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int0_1817 = torch.constant.int 0 %1920 = torch.aten.index_select %1901, %int0_1817, %1919 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_1818 = torch.constant.int 4 %int16_1819 = torch.constant.int 16 %int32_1820 = torch.constant.int 32 %int100_1821 = 
torch.constant.int 100 %1921 = torch.prim.ListConstruct %int4_1818, %655, %int16_1819, %int32_1820, %int100_1821 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1922 = torch.aten.view %1920, %1921 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_1822 = torch.constant.int 1 %1923 = torch.aten.size.int %1922, %int1_1822 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_1823 = torch.constant.int 16 %1924 = torch.aten.mul.int %1923, %int16_1823 : !torch.int, !torch.int -> !torch.int %int4_1824 = torch.constant.int 4 %int32_1825 = torch.constant.int 32 %int100_1826 = torch.constant.int 100 %1925 = torch.prim.ListConstruct %int4_1824, %1924, %int32_1825, %int100_1826 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1926 = torch.aten.view %1922, %1925 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_1827 = torch.constant.int 0 %int0_1828 = torch.constant.int 0 %int9223372036854775807_1829 = torch.constant.int 9223372036854775807 %int1_1830 = torch.constant.int 1 %1927 = torch.aten.slice.Tensor %1667, %int0_1827, %int0_1828, %int9223372036854775807_1829, %int1_1830 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_1831 = torch.constant.int 1 %int0_1832 = torch.constant.int 0 %int1_1833 = torch.constant.int 1 %1928 = torch.aten.slice.Tensor %1927, %int1_1831, %int0_1832, %1910, %int1_1833 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_1834 = torch.constant.bool false %1929 = torch.aten.copy %1928, %1926, %false_1834 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_1835 = torch.constant.int 0 %int0_1836 = torch.constant.int 0 %int9223372036854775807_1837 = torch.constant.int 
9223372036854775807 %int1_1838 = torch.constant.int 1 %1930 = torch.aten.slice.Tensor %1667, %int0_1835, %int0_1836, %int9223372036854775807_1837, %int1_1838 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_1839 = torch.constant.int 1 %int0_1840 = torch.constant.int 0 %int1_1841 = torch.constant.int 1 %1931 = torch.aten.slice_scatter %1930, %1929, %int1_1839, %int0_1840, %1910, %int1_1841 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_1842 = torch.constant.int 0 %int0_1843 = torch.constant.int 0 %int9223372036854775807_1844 = torch.constant.int 9223372036854775807 %int1_1845 = torch.constant.int 1 %1932 = torch.aten.slice_scatter %1667, %1931, %int0_1842, %int0_1843, %int9223372036854775807_1844, %int1_1845 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_1846 = torch.constant.int 0 %int0_1847 = torch.constant.int 0 %int9223372036854775807_1848 = torch.constant.int 9223372036854775807 %int1_1849 = torch.constant.int 1 %1933 = torch.aten.slice.Tensor %671, %int0_1846, %int0_1847, %int9223372036854775807_1848, %int1_1849 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_1850 = torch.constant.int 1 %int0_1851 = torch.constant.int 0 %int1_1852 = torch.constant.int 1 %1934 = torch.aten.slice.Tensor %1933, %int1_1850, %int0_1851, %1910, %int1_1852 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int0_1853 = torch.constant.int 0 %int0_1854 = torch.constant.int 0 %int9223372036854775807_1855 = torch.constant.int 9223372036854775807 %int1_1856 = torch.constant.int 1 %1935 = torch.aten.slice.Tensor %673, 
%int0_1853, %int0_1854, %int9223372036854775807_1855, %int1_1856 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_1857 = torch.constant.int 1 %int0_1858 = torch.constant.int 0 %int1_1859 = torch.constant.int 1 %1936 = torch.aten.slice.Tensor %1935, %int1_1857, %int0_1858, %1910, %int1_1859 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_1860 = torch.constant.int 1 %int2_1861 = torch.constant.int 2 %1937 = torch.aten.transpose.int %1773, %int1_1860, %int2_1861 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,1,100],f32> %int4_1862 = torch.constant.int 4 %int32_1863 = torch.constant.int 32 %int1_1864 = torch.constant.int 1 %int100_1865 = torch.constant.int 100 %1938 = torch.prim.ListConstruct %int4_1862, %int32_1863, %int1_1864, %int100_1865 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_1866 = torch.constant.bool false %1939 = torch.aten.expand %1937, %1938, %false_1866 : !torch.vtensor<[4,32,1,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,100],f32> %int128_1867 = torch.constant.int 128 %int1_1868 = torch.constant.int 1 %int100_1869 = torch.constant.int 100 %1940 = torch.prim.ListConstruct %int128_1867, %int1_1868, %int100_1869 : (!torch.int, !torch.int, !torch.int) -> !torch.list %1941 = torch.aten.view %1939, %1940 : !torch.vtensor<[4,32,1,100],f32>, !torch.list -> !torch.vtensor<[128,1,100],f32> %int0_1870 = torch.constant.int 0 %int0_1871 = torch.constant.int 0 %int9223372036854775807_1872 = torch.constant.int 9223372036854775807 %int1_1873 = torch.constant.int 1 %1942 = torch.aten.slice.Tensor %1915, %int0_1870, %int0_1871, %int9223372036854775807_1872, %int1_1873 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_1874 = torch.constant.int 1 
%int0_1875 = torch.constant.int 0 %int1_1876 = torch.constant.int 1 %1943 = torch.aten.slice.Tensor %1942, %int1_1874, %int0_1875, %1910, %int1_1876 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_1877 = torch.constant.int 1 %int2_1878 = torch.constant.int 2 %1944 = torch.aten.transpose.int %1943, %int1_1877, %int2_1878 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int2_1879 = torch.constant.int 2 %int3_1880 = torch.constant.int 3 %1945 = torch.aten.transpose.int %1944, %int2_1879, %int3_1880 : !torch.vtensor<[4,32,?,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int1_1881 = torch.constant.int 1 %1946 = torch.aten.size.int %1934, %int1_1881 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_1882 = torch.constant.int 4 %int32_1883 = torch.constant.int 32 %int100_1884 = torch.constant.int 100 %1947 = torch.prim.ListConstruct %int4_1882, %int32_1883, %int100_1884, %1946 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_1885 = torch.constant.bool false %1948 = torch.aten.expand %1945, %1947, %false_1885 : !torch.vtensor<[4,32,100,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,100,?],f32> %int0_1886 = torch.constant.int 0 %1949 = torch.aten.clone %1948, %int0_1886 : !torch.vtensor<[4,32,100,?],f32>, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int128_1887 = torch.constant.int 128 %int100_1888 = torch.constant.int 100 %1950 = torch.prim.ListConstruct %int128_1887, %int100_1888, %1946 : (!torch.int, !torch.int, !torch.int) -> !torch.list %1951 = torch.aten._unsafe_view %1949, %1950 : !torch.vtensor<[4,32,100,?],f32>, !torch.list -> !torch.vtensor<[128,100,?],f32> %1952 = torch.aten.bmm %1941, %1951 : !torch.vtensor<[128,1,100],f32>, !torch.vtensor<[128,100,?],f32> -> !torch.vtensor<[128,1,?],f32> %int4_1889 = torch.constant.int 4 %int32_1890 = torch.constant.int 32 
%int1_1891 = torch.constant.int 1 %1953 = torch.prim.ListConstruct %int4_1889, %int32_1890, %int1_1891, %1946 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1954 = torch.aten.view %1952, %1953 : !torch.vtensor<[128,1,?],f32>, !torch.list -> !torch.vtensor<[4,32,1,?],f32> %float1.000000e01_1892 = torch.constant.float 1.000000e+01 %1955 = torch.aten.div.Scalar %1954, %float1.000000e01_1892 : !torch.vtensor<[4,32,1,?],f32>, !torch.float -> !torch.vtensor<[4,32,1,?],f32> %int1_1893 = torch.constant.int 1 %1956 = torch.aten.add.Tensor %1955, %895, %int1_1893 : !torch.vtensor<[4,32,1,?],f32>, !torch.vtensor<[4,1,1,?],f32>, !torch.int -> !torch.vtensor<[4,32,1,?],f32> %int-1_1894 = torch.constant.int -1 %false_1895 = torch.constant.bool false %1957 = torch.aten._softmax %1956, %int-1_1894, %false_1895 : !torch.vtensor<[4,32,1,?],f32>, !torch.int, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int4_1896 = torch.constant.int 4 %int32_1897 = torch.constant.int 32 %int1_1898 = torch.constant.int 1 %1958 = torch.prim.ListConstruct %int4_1896, %int32_1897, %int1_1898, %1946 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_1899 = torch.constant.bool false %1959 = torch.aten.expand %1957, %1958, %false_1899 : !torch.vtensor<[4,32,1,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int128_1900 = torch.constant.int 128 %int1_1901 = torch.constant.int 1 %1960 = torch.prim.ListConstruct %int128_1900, %int1_1901, %1946 : (!torch.int, !torch.int, !torch.int) -> !torch.list %1961 = torch.aten.view %1959, %1960 : !torch.vtensor<[4,32,1,?],f32>, !torch.list -> !torch.vtensor<[128,1,?],f32> %int0_1902 = torch.constant.int 0 %int0_1903 = torch.constant.int 0 %int9223372036854775807_1904 = torch.constant.int 9223372036854775807 %int1_1905 = torch.constant.int 1 %1962 = torch.aten.slice.Tensor %1932, %int0_1902, %int0_1903, %int9223372036854775807_1904, %int1_1905 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, 
!torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_1906 = torch.constant.int 1 %int0_1907 = torch.constant.int 0 %int1_1908 = torch.constant.int 1 %1963 = torch.aten.slice.Tensor %1962, %int1_1906, %int0_1907, %1910, %int1_1908 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_1909 = torch.constant.int 1 %int2_1910 = torch.constant.int 2 %1964 = torch.aten.transpose.int %1963, %int1_1909, %int2_1910 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int1_1911 = torch.constant.int 1 %1965 = torch.aten.size.int %1936, %int1_1911 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_1912 = torch.constant.int 4 %int32_1913 = torch.constant.int 32 %int100_1914 = torch.constant.int 100 %1966 = torch.prim.ListConstruct %int4_1912, %int32_1913, %1965, %int100_1914 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_1915 = torch.constant.bool false %1967 = torch.aten.expand %1964, %1966, %false_1915 : !torch.vtensor<[4,32,?,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,?,100],f32> %int0_1916 = torch.constant.int 0 %1968 = torch.aten.clone %1967, %int0_1916 : !torch.vtensor<[4,32,?,100],f32>, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int128_1917 = torch.constant.int 128 %int100_1918 = torch.constant.int 100 %1969 = torch.prim.ListConstruct %int128_1917, %1965, %int100_1918 : (!torch.int, !torch.int, !torch.int) -> !torch.list %1970 = torch.aten._unsafe_view %1968, %1969 : !torch.vtensor<[4,32,?,100],f32>, !torch.list -> !torch.vtensor<[128,?,100],f32> %1971 = torch.aten.bmm %1961, %1970 : !torch.vtensor<[128,1,?],f32>, !torch.vtensor<[128,?,100],f32> -> !torch.vtensor<[128,1,100],f32> %int4_1919 = torch.constant.int 4 %int32_1920 = torch.constant.int 32 %int1_1921 = torch.constant.int 1 %int100_1922 = torch.constant.int 100 %1972 = torch.prim.ListConstruct %int4_1919, %int32_1920, 
%int1_1921, %int100_1922 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %1973 = torch.aten.view %1971, %1972 : !torch.vtensor<[128,1,100],f32>, !torch.list -> !torch.vtensor<[4,32,1,100],f32> %int1_1923 = torch.constant.int 1 %int2_1924 = torch.constant.int 2 %1974 = torch.aten.transpose.int %1973, %int1_1923, %int2_1924 : !torch.vtensor<[4,32,1,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,1,32,100],f32> %int4_1925 = torch.constant.int 4 %int1_1926 = torch.constant.int 1 %int-1_1927 = torch.constant.int -1 %1975 = torch.prim.ListConstruct %int4_1925, %int1_1926, %int-1_1927 : (!torch.int, !torch.int, !torch.int) -> !torch.list %1976 = torch.aten.view %1974, %1975 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,3200],f32> %1977 = torch_c.to_builtin_tensor %1976 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_1928 = tensor.cast %1977 : tensor<4x1x3200xf32> to tensor %1978 = torch_c.to_builtin_tensor %42 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %1979 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_1928, %1978) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_1929 = tensor.cast %1979 : tensor to tensor<4x1x3200xf32> %1980 = torch_c.from_builtin_tensor %cast_1929 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int1_1930 = torch.constant.int 1 %1981 = torch.aten.add.Tensor %1738, %1980, %int1_1930 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_1931 = torch.constant.int 2 %1982 = torch.aten.pow.Tensor_Scalar %1981, %int2_1931 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_1932 = torch.constant.int -1 %1983 = torch.prim.ListConstruct %int-1_1932 : (!torch.int) -> !torch.list %true_1933 = torch.constant.bool true %none_1934 = torch.constant.none %1984 = torch.aten.mean.dim %1982, %1983, %true_1933, %none_1934 : !torch.vtensor<[4,1,3200],f32>, !torch.list, 
!torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_1935 = torch.constant.float 9.9999999747524271E-7 %int1_1936 = torch.constant.int 1 %1985 = torch.aten.add.Scalar %1984, %float9.999990e-07_1935, %int1_1936 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %1986 = torch.aten.rsqrt %1985 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %1987 = torch.aten.mul.Tensor %1981, %1986 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %1988 = torch.aten.mul.Tensor %1987, %43 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %1989 = torch_c.to_builtin_tensor %1988 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_1937 = tensor.cast %1989 : tensor<4x1x3200xf32> to tensor %1990 = torch_c.to_builtin_tensor %44 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %1991 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_1937, %1990) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_1938 = tensor.cast %1991 : tensor to tensor<4x1x8640xf32> %1992 = torch_c.from_builtin_tensor %cast_1938 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %1993 = torch.aten.silu %1992 : !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32> %1994 = torch_c.to_builtin_tensor %1988 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_1939 = tensor.cast %1994 : tensor<4x1x3200xf32> to tensor %1995 = torch_c.to_builtin_tensor %45 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %1996 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_1939, %1995) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_1940 = tensor.cast %1996 : tensor to tensor<4x1x8640xf32> %1997 = torch_c.from_builtin_tensor %cast_1940 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %1998 = torch.aten.mul.Tensor %1993, %1997 : !torch.vtensor<[4,1,8640],f32>, !torch.vtensor<[4,1,8640],f32> -> 
!torch.vtensor<[4,1,8640],f32> %1999 = torch_c.to_builtin_tensor %1998 : !torch.vtensor<[4,1,8640],f32> -> tensor<4x1x8640xf32> %cast_1941 = tensor.cast %1999 : tensor<4x1x8640xf32> to tensor %2000 = torch_c.to_builtin_tensor %46 : !torch.vtensor<[3200,8640],f16> -> tensor<3200x8640xf16> %2001 = util.call @sharktank_mmtfp_3d_3200_8640_f32f16f32(%cast_1941, %2000) : (tensor, tensor<3200x8640xf16>) -> tensor %cast_1942 = tensor.cast %2001 : tensor to tensor<4x1x3200xf32> %2002 = torch_c.from_builtin_tensor %cast_1942 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int1_1943 = torch.constant.int 1 %2003 = torch.aten.add.Tensor %1981, %2002, %int1_1943 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_1944 = torch.constant.int 2 %2004 = torch.aten.pow.Tensor_Scalar %2003, %int2_1944 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_1945 = torch.constant.int -1 %2005 = torch.prim.ListConstruct %int-1_1945 : (!torch.int) -> !torch.list %true_1946 = torch.constant.bool true %none_1947 = torch.constant.none %2006 = torch.aten.mean.dim %2004, %2005, %true_1946, %none_1947 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_1948 = torch.constant.float 9.9999999747524271E-7 %int1_1949 = torch.constant.int 1 %2007 = torch.aten.add.Scalar %2006, %float9.999990e-07_1948, %int1_1949 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %2008 = torch.aten.rsqrt %2007 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %2009 = torch.aten.mul.Tensor %2003, %2008 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %2010 = torch.aten.mul.Tensor %2009, %47 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %2011 = torch_c.to_builtin_tensor %2010 : !torch.vtensor<[4,1,3200],f32> 
-> tensor<4x1x3200xf32> %cast_1950 = tensor.cast %2011 : tensor<4x1x3200xf32> to tensor %2012 = torch_c.to_builtin_tensor %48 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %2013 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_1950, %2012) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_1951 = tensor.cast %2013 : tensor to tensor<4x1x3200xf32> %2014 = torch_c.from_builtin_tensor %cast_1951 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %2015 = torch_c.to_builtin_tensor %2010 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_1952 = tensor.cast %2015 : tensor<4x1x3200xf32> to tensor %2016 = torch_c.to_builtin_tensor %49 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %2017 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_1952, %2016) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_1953 = tensor.cast %2017 : tensor to tensor<4x1x3200xf32> %2018 = torch_c.from_builtin_tensor %cast_1953 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %2019 = torch_c.to_builtin_tensor %2010 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_1954 = tensor.cast %2019 : tensor<4x1x3200xf32> to tensor %2020 = torch_c.to_builtin_tensor %50 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %2021 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_1954, %2020) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_1955 = tensor.cast %2021 : tensor to tensor<4x1x3200xf32> %2022 = torch_c.from_builtin_tensor %cast_1955 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int4_1956 = torch.constant.int 4 %int1_1957 = torch.constant.int 1 %int32_1958 = torch.constant.int 32 %int100_1959 = torch.constant.int 100 %2023 = torch.prim.ListConstruct %int4_1956, %int1_1957, %int32_1958, %int100_1959 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2024 = torch.aten.view %2014, %2023 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_1960 = 
torch.constant.int 4 %int1_1961 = torch.constant.int 1 %int32_1962 = torch.constant.int 32 %int100_1963 = torch.constant.int 100 %2025 = torch.prim.ListConstruct %int4_1960, %int1_1961, %int32_1962, %int100_1963 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2026 = torch.aten.view %2018, %2025 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_1964 = torch.constant.int 4 %int1_1965 = torch.constant.int 1 %int32_1966 = torch.constant.int 32 %int100_1967 = torch.constant.int 100 %2027 = torch.prim.ListConstruct %int4_1964, %int1_1965, %int32_1966, %int100_1967 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2028 = torch.aten.view %2022, %2027 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_1968 = torch.constant.int 4 %int1_1969 = torch.constant.int 1 %int32_1970 = torch.constant.int 32 %int-1_1971 = torch.constant.int -1 %int2_1972 = torch.constant.int 2 %2029 = torch.prim.ListConstruct %int4_1968, %int1_1969, %int32_1970, %int-1_1971, %int2_1972 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2030 = torch.aten.view %2024, %2029 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %2031 = torch.aten.view_as_complex %2030 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %int4_1973 = torch.constant.int 4 %int1_1974 = torch.constant.int 1 %int32_1975 = torch.constant.int 32 %int-1_1976 = torch.constant.int -1 %int2_1977 = torch.constant.int 2 %2032 = torch.prim.ListConstruct %int4_1973, %int1_1974, %int32_1975, %int-1_1976, %int2_1977 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2033 = torch.aten.view %2026, %2032 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %2034 = torch.aten.view_as_complex %2033 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %2035 = 
torch.aten.mul.Tensor %2031, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %2036 = torch.aten.view_as_real %2035 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_1978 = torch.constant.int 4 %int1_1979 = torch.constant.int 1 %int32_1980 = torch.constant.int 32 %int100_1981 = torch.constant.int 100 %2037 = torch.prim.ListConstruct %int4_1978, %int1_1979, %int32_1980, %int100_1981 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2038 = torch.aten.view %2036, %2037 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %2039 = torch.aten.mul.Tensor %2034, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %2040 = torch.aten.view_as_real %2039 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_1982 = torch.constant.int 4 %int1_1983 = torch.constant.int 1 %int32_1984 = torch.constant.int 32 %int100_1985 = torch.constant.int 100 %2041 = torch.prim.ListConstruct %int4_1982, %int1_1983, %int32_1984, %int100_1985 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2042 = torch.aten.view %2040, %2041 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int1_1986 = torch.constant.int 1 %int1_1987 = torch.constant.int 1 %2043 = torch.aten.add.Scalar %arg2, %int1_1986, %int1_1987 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[4],si64> %int0_1988 = torch.constant.int 0 %int0_1989 = torch.constant.int 0 %2044 = torch.aten.select.int %2043, %int0_1988, %int0_1989 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_1990 = torch.constant.int 0 %int0_1991 = torch.constant.int 0 %2045 = torch.aten.select.int %arg3, %int0_1990, %int0_1991 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_1992 = 
torch.constant.int 0 %int0_1993 = torch.constant.int 0 %int9223372036854775807_1994 = torch.constant.int 9223372036854775807 %int1_1995 = torch.constant.int 1 %2046 = torch.aten.slice.Tensor %2045, %int0_1992, %int0_1993, %int9223372036854775807_1994, %int1_1995 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_1996 = torch.constant.int 16 %2047 = torch.aten.floor_divide.Scalar %2044, %int16_1996 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_1997 = torch.constant.int 0 %2048 = torch.aten.index_select %2046, %int0_1997, %2047 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_1998 = torch.constant.int 16 %2049 = torch.aten.remainder.Scalar %2044, %int16_1998 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_1999 = torch.constant.none %2050 = torch.aten.clone %318, %none_1999 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_2000 = torch.constant.none %2051 = torch.aten.clone %319, %none_2000 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_2001 = torch.constant.int 0 %2052 = torch.aten.unsqueeze %2049, %int0_2001 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_2002 = torch.constant.int 0 %int0_2003 = torch.constant.int 0 %2053 = torch.aten.select.int %2042, %int0_2002, %int0_2003 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_2004 = torch.constant.int 0 %int0_2005 = torch.constant.int 0 %2054 = torch.aten.select.int %2053, %int0_2004, %int0_2005 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %int-1_2006 = torch.constant.int -1 %int26_2007 = torch.constant.int 26 %int2_2008 = torch.constant.int 2 %int16_2009 = torch.constant.int 16 %int32_2010 = torch.constant.int 32 %int100_2011 = torch.constant.int 100 %2055 = torch.prim.ListConstruct %int-1_2006, 
%int26_2007, %int2_2008, %int16_2009, %int32_2010, %int100_2011 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2056 = torch.aten.view %1890, %2055 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %2057 = torch.prim.ListConstruct %2048, %2050, %2051, %2052 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_2012 = torch.constant.bool false %2058 = torch.aten.index_put %2056, %2057, %2054, %false_2012 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_2013 = torch.constant.int 2662400 %2059 = torch.prim.ListConstruct %731, %int2662400_2013 : (!torch.int, !torch.int) -> !torch.list %2060 = torch.aten.view %2058, %2059 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_2014 = torch.constant.int -1 %int26_2015 = torch.constant.int 26 %int2_2016 = torch.constant.int 2 %int16_2017 = torch.constant.int 16 %int32_2018 = torch.constant.int 32 %int100_2019 = torch.constant.int 100 %2061 = torch.prim.ListConstruct %int-1_2014, %int26_2015, %int2_2016, %int16_2017, %int32_2018, %int100_2019 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2062 = torch.aten.view %2060, %2061 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_2020 = torch.constant.none %2063 = torch.aten.clone %320, %none_2020 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_2021 = torch.constant.none %2064 = torch.aten.clone %321, %none_2021 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_2022 = torch.constant.int 0 %2065 = torch.aten.unsqueeze %2049, %int0_2022 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_2023 = torch.constant.int 0 %int0_2024 = 
torch.constant.int 0 %2066 = torch.aten.select.int %2028, %int0_2023, %int0_2024 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_2025 = torch.constant.int 0 %int0_2026 = torch.constant.int 0 %2067 = torch.aten.select.int %2066, %int0_2025, %int0_2026 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %2068 = torch.prim.ListConstruct %2048, %2063, %2064, %2065 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_2027 = torch.constant.bool false %2069 = torch.aten.index_put %2062, %2068, %2067, %false_2027 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_2028 = torch.constant.int 2662400 %2070 = torch.prim.ListConstruct %731, %int2662400_2028 : (!torch.int, !torch.int) -> !torch.list %2071 = torch.aten.view %2069, %2070 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_2029 = torch.constant.int -1 %int26_2030 = torch.constant.int 26 %int2_2031 = torch.constant.int 2 %int16_2032 = torch.constant.int 16 %int32_2033 = torch.constant.int 32 %int100_2034 = torch.constant.int 100 %2072 = torch.prim.ListConstruct %int-1_2029, %int26_2030, %int2_2031, %int16_2032, %int32_2033, %int100_2034 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2073 = torch.aten.view %2071, %2072 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_2035 = torch.constant.int 0 %int1_2036 = torch.constant.int 1 %2074 = torch.aten.select.int %2043, %int0_2035, %int1_2036 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_2037 = torch.constant.int 0 %int1_2038 = torch.constant.int 1 %2075 = torch.aten.select.int %arg3, %int0_2037, %int1_2038 : !torch.vtensor<[4,?],si64>, 
!torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_2039 = torch.constant.int 0 %int0_2040 = torch.constant.int 0 %int9223372036854775807_2041 = torch.constant.int 9223372036854775807 %int1_2042 = torch.constant.int 1 %2076 = torch.aten.slice.Tensor %2075, %int0_2039, %int0_2040, %int9223372036854775807_2041, %int1_2042 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_2043 = torch.constant.int 16 %2077 = torch.aten.floor_divide.Scalar %2074, %int16_2043 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_2044 = torch.constant.int 0 %2078 = torch.aten.index_select %2076, %int0_2044, %2077 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_2045 = torch.constant.int 16 %2079 = torch.aten.remainder.Scalar %2074, %int16_2045 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_2046 = torch.constant.none %2080 = torch.aten.clone %322, %none_2046 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_2047 = torch.constant.none %2081 = torch.aten.clone %323, %none_2047 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_2048 = torch.constant.int 0 %2082 = torch.aten.unsqueeze %2079, %int0_2048 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_2049 = torch.constant.int 0 %int1_2050 = torch.constant.int 1 %2083 = torch.aten.select.int %2042, %int0_2049, %int1_2050 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_2051 = torch.constant.int 0 %int0_2052 = torch.constant.int 0 %2084 = torch.aten.select.int %2083, %int0_2051, %int0_2052 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %2085 = torch.prim.ListConstruct %2078, %2080, %2081, %2082 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_2053 = 
torch.constant.bool false %2086 = torch.aten.index_put %2073, %2085, %2084, %false_2053 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_2054 = torch.constant.int 2662400 %2087 = torch.prim.ListConstruct %731, %int2662400_2054 : (!torch.int, !torch.int) -> !torch.list %2088 = torch.aten.view %2086, %2087 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_2055 = torch.constant.int -1 %int26_2056 = torch.constant.int 26 %int2_2057 = torch.constant.int 2 %int16_2058 = torch.constant.int 16 %int32_2059 = torch.constant.int 32 %int100_2060 = torch.constant.int 100 %2089 = torch.prim.ListConstruct %int-1_2055, %int26_2056, %int2_2057, %int16_2058, %int32_2059, %int100_2060 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2090 = torch.aten.view %2088, %2089 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_2061 = torch.constant.none %2091 = torch.aten.clone %324, %none_2061 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_2062 = torch.constant.none %2092 = torch.aten.clone %325, %none_2062 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_2063 = torch.constant.int 0 %2093 = torch.aten.unsqueeze %2079, %int0_2063 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_2064 = torch.constant.int 0 %int1_2065 = torch.constant.int 1 %2094 = torch.aten.select.int %2028, %int0_2064, %int1_2065 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_2066 = torch.constant.int 0 %int0_2067 = torch.constant.int 0 %2095 = torch.aten.select.int %2094, %int0_2066, %int0_2067 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %2096 = torch.prim.ListConstruct %2078, %2091, %2092, %2093 : (!torch.vtensor<[1],si64>, 
!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_2068 = torch.constant.bool false %2097 = torch.aten.index_put %2090, %2096, %2095, %false_2068 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_2069 = torch.constant.int 2662400 %2098 = torch.prim.ListConstruct %731, %int2662400_2069 : (!torch.int, !torch.int) -> !torch.list %2099 = torch.aten.view %2097, %2098 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_2070 = torch.constant.int -1 %int26_2071 = torch.constant.int 26 %int2_2072 = torch.constant.int 2 %int16_2073 = torch.constant.int 16 %int32_2074 = torch.constant.int 32 %int100_2075 = torch.constant.int 100 %2100 = torch.prim.ListConstruct %int-1_2070, %int26_2071, %int2_2072, %int16_2073, %int32_2074, %int100_2075 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2101 = torch.aten.view %2099, %2100 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_2076 = torch.constant.int 0 %int2_2077 = torch.constant.int 2 %2102 = torch.aten.select.int %2043, %int0_2076, %int2_2077 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_2078 = torch.constant.int 0 %int2_2079 = torch.constant.int 2 %2103 = torch.aten.select.int %arg3, %int0_2078, %int2_2079 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_2080 = torch.constant.int 0 %int0_2081 = torch.constant.int 0 %int9223372036854775807_2082 = torch.constant.int 9223372036854775807 %int1_2083 = torch.constant.int 1 %2104 = torch.aten.slice.Tensor %2103, %int0_2080, %int0_2081, %int9223372036854775807_2082, %int1_2083 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_2084 = torch.constant.int 16 %2105 = 
torch.aten.floor_divide.Scalar %2102, %int16_2084 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_2085 = torch.constant.int 0 %2106 = torch.aten.index_select %2104, %int0_2085, %2105 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_2086 = torch.constant.int 16 %2107 = torch.aten.remainder.Scalar %2102, %int16_2086 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_2087 = torch.constant.none %2108 = torch.aten.clone %326, %none_2087 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_2088 = torch.constant.none %2109 = torch.aten.clone %327, %none_2088 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_2089 = torch.constant.int 0 %2110 = torch.aten.unsqueeze %2107, %int0_2089 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_2090 = torch.constant.int 0 %int2_2091 = torch.constant.int 2 %2111 = torch.aten.select.int %2042, %int0_2090, %int2_2091 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_2092 = torch.constant.int 0 %int0_2093 = torch.constant.int 0 %2112 = torch.aten.select.int %2111, %int0_2092, %int0_2093 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %2113 = torch.prim.ListConstruct %2106, %2108, %2109, %2110 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_2094 = torch.constant.bool false %2114 = torch.aten.index_put %2101, %2113, %2112, %false_2094 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_2095 = torch.constant.int 2662400 %2115 = torch.prim.ListConstruct %731, %int2662400_2095 : (!torch.int, !torch.int) -> !torch.list %2116 = torch.aten.view %2114, %2115 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> 
!torch.vtensor<[?,2662400],f32> %int-1_2096 = torch.constant.int -1 %int26_2097 = torch.constant.int 26 %int2_2098 = torch.constant.int 2 %int16_2099 = torch.constant.int 16 %int32_2100 = torch.constant.int 32 %int100_2101 = torch.constant.int 100 %2117 = torch.prim.ListConstruct %int-1_2096, %int26_2097, %int2_2098, %int16_2099, %int32_2100, %int100_2101 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2118 = torch.aten.view %2116, %2117 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_2102 = torch.constant.none %2119 = torch.aten.clone %328, %none_2102 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_2103 = torch.constant.none %2120 = torch.aten.clone %329, %none_2103 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_2104 = torch.constant.int 0 %2121 = torch.aten.unsqueeze %2107, %int0_2104 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_2105 = torch.constant.int 0 %int2_2106 = torch.constant.int 2 %2122 = torch.aten.select.int %2028, %int0_2105, %int2_2106 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_2107 = torch.constant.int 0 %int0_2108 = torch.constant.int 0 %2123 = torch.aten.select.int %2122, %int0_2107, %int0_2108 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %2124 = torch.prim.ListConstruct %2106, %2119, %2120, %2121 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_2109 = torch.constant.bool false %2125 = torch.aten.index_put %2118, %2124, %2123, %false_2109 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_2110 = torch.constant.int 2662400 %2126 = torch.prim.ListConstruct %731, %int2662400_2110 : (!torch.int, !torch.int) 
-> !torch.list %2127 = torch.aten.view %2125, %2126 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_2111 = torch.constant.int -1 %int26_2112 = torch.constant.int 26 %int2_2113 = torch.constant.int 2 %int16_2114 = torch.constant.int 16 %int32_2115 = torch.constant.int 32 %int100_2116 = torch.constant.int 100 %2128 = torch.prim.ListConstruct %int-1_2111, %int26_2112, %int2_2113, %int16_2114, %int32_2115, %int100_2116 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2129 = torch.aten.view %2127, %2128 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_2117 = torch.constant.int 0 %int3_2118 = torch.constant.int 3 %2130 = torch.aten.select.int %2043, %int0_2117, %int3_2118 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_2119 = torch.constant.int 0 %int3_2120 = torch.constant.int 3 %2131 = torch.aten.select.int %arg3, %int0_2119, %int3_2120 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_2121 = torch.constant.int 0 %int0_2122 = torch.constant.int 0 %int9223372036854775807_2123 = torch.constant.int 9223372036854775807 %int1_2124 = torch.constant.int 1 %2132 = torch.aten.slice.Tensor %2131, %int0_2121, %int0_2122, %int9223372036854775807_2123, %int1_2124 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_2125 = torch.constant.int 16 %2133 = torch.aten.floor_divide.Scalar %2130, %int16_2125 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_2126 = torch.constant.int 0 %2134 = torch.aten.index_select %2132, %int0_2126, %2133 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_2127 = torch.constant.int 16 %2135 = torch.aten.remainder.Scalar %2130, %int16_2127 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_2128 = 
torch.constant.none %2136 = torch.aten.clone %330, %none_2128 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_2129 = torch.constant.none %2137 = torch.aten.clone %331, %none_2129 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_2130 = torch.constant.int 0 %2138 = torch.aten.unsqueeze %2135, %int0_2130 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_2131 = torch.constant.int 0 %int3_2132 = torch.constant.int 3 %2139 = torch.aten.select.int %2042, %int0_2131, %int3_2132 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_2133 = torch.constant.int 0 %int0_2134 = torch.constant.int 0 %2140 = torch.aten.select.int %2139, %int0_2133, %int0_2134 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %2141 = torch.prim.ListConstruct %2134, %2136, %2137, %2138 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_2135 = torch.constant.bool false %2142 = torch.aten.index_put %2129, %2141, %2140, %false_2135 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_2136 = torch.constant.int 2662400 %2143 = torch.prim.ListConstruct %731, %int2662400_2136 : (!torch.int, !torch.int) -> !torch.list %2144 = torch.aten.view %2142, %2143 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_2137 = torch.constant.int -1 %int26_2138 = torch.constant.int 26 %int2_2139 = torch.constant.int 2 %int16_2140 = torch.constant.int 16 %int32_2141 = torch.constant.int 32 %int100_2142 = torch.constant.int 100 %2145 = torch.prim.ListConstruct %int-1_2137, %int26_2138, %int2_2139, %int16_2140, %int32_2141, %int100_2142 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2146 = torch.aten.view %2144, 
%2145 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_2143 = torch.constant.none %2147 = torch.aten.clone %332, %none_2143 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_2144 = torch.constant.none %2148 = torch.aten.clone %333, %none_2144 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_2145 = torch.constant.int 0 %2149 = torch.aten.unsqueeze %2135, %int0_2145 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_2146 = torch.constant.int 0 %int3_2147 = torch.constant.int 3 %2150 = torch.aten.select.int %2028, %int0_2146, %int3_2147 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_2148 = torch.constant.int 0 %int0_2149 = torch.constant.int 0 %2151 = torch.aten.select.int %2150, %int0_2148, %int0_2149 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %2152 = torch.prim.ListConstruct %2134, %2147, %2148, %2149 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_2150 = torch.constant.bool false %2153 = torch.aten.index_put %2146, %2152, %2151, %false_2150 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_2151 = torch.constant.int 2662400 %2154 = torch.prim.ListConstruct %731, %int2662400_2151 : (!torch.int, !torch.int) -> !torch.list %2155 = torch.aten.view %2153, %2154 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int52_2152 = torch.constant.int 52 %2156 = torch.aten.mul.Scalar %arg3, %int52_2152 : !torch.vtensor<[4,?],si64>, !torch.int -> !torch.vtensor<[4,?],si64> %int10 = torch.constant.int 10 %int1_2153 = torch.constant.int 1 %2157 = torch.aten.add.Scalar %2156, %int10, %int1_2153 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> 
!torch.vtensor<[4,?],si64> %int4_2154 = torch.constant.int 4 %2158 = torch.aten.mul.int %int4_2154, %655 : !torch.int, !torch.int -> !torch.int %2159 = torch.prim.ListConstruct %2158 : (!torch.int) -> !torch.list %2160 = torch.aten.view %2157, %2159 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int-1_2155 = torch.constant.int -1 %int26_2156 = torch.constant.int 26 %int2_2157 = torch.constant.int 2 %int16_2158 = torch.constant.int 16 %int32_2159 = torch.constant.int 32 %int100_2160 = torch.constant.int 100 %2161 = torch.prim.ListConstruct %int-1_2155, %int26_2156, %int2_2157, %int16_2158, %int32_2159, %int100_2160 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2162 = torch.aten.view %2155, %2161 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int26_2161 = torch.constant.int 26 %2163 = torch.aten.mul.int %731, %int26_2161 : !torch.int, !torch.int -> !torch.int %int2_2162 = torch.constant.int 2 %2164 = torch.aten.mul.int %2163, %int2_2162 : !torch.int, !torch.int -> !torch.int %int16_2163 = torch.constant.int 16 %int32_2164 = torch.constant.int 32 %int100_2165 = torch.constant.int 100 %2165 = torch.prim.ListConstruct %2164, %int16_2163, %int32_2164, %int100_2165 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2166 = torch.aten.view %2162, %2165 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,16,32,100],f32> %int0_2166 = torch.constant.int 0 %2167 = torch.aten.index_select %2166, %int0_2166, %2160 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_2167 = torch.constant.int 4 %int16_2168 = torch.constant.int 16 %int32_2169 = torch.constant.int 32 %int100_2170 = torch.constant.int 100 %2168 = torch.prim.ListConstruct %int4_2167, %655, %int16_2168, %int32_2169, %int100_2170 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list 
%2169 = torch.aten.view %2167, %2168 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_2171 = torch.constant.int 1 %2170 = torch.aten.size.int %2169, %int1_2171 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_2172 = torch.constant.int 16 %2171 = torch.aten.mul.int %2170, %int16_2172 : !torch.int, !torch.int -> !torch.int %int4_2173 = torch.constant.int 4 %int32_2174 = torch.constant.int 32 %int100_2175 = torch.constant.int 100 %2172 = torch.prim.ListConstruct %int4_2173, %2171, %int32_2174, %int100_2175 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2173 = torch.aten.view %2169, %2172 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_2176 = torch.constant.int 0 %int0_2177 = torch.constant.int 0 %int9223372036854775807_2178 = torch.constant.int 9223372036854775807 %int1_2179 = torch.constant.int 1 %2174 = torch.aten.slice.Tensor %1915, %int0_2176, %int0_2177, %int9223372036854775807_2178, %int1_2179 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int16_2180 = torch.constant.int 16 %2175 = torch.aten.mul.int %655, %int16_2180 : !torch.int, !torch.int -> !torch.int %int1_2181 = torch.constant.int 1 %int0_2182 = torch.constant.int 0 %int1_2183 = torch.constant.int 1 %2176 = torch.aten.slice.Tensor %2174, %int1_2181, %int0_2182, %2175, %int1_2183 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_2184 = torch.constant.bool false %2177 = torch.aten.copy %2176, %2173, %false_2184 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_2185 = torch.constant.int 0 %int0_2186 = torch.constant.int 0 %int9223372036854775807_2187 = torch.constant.int 9223372036854775807 %int1_2188 = torch.constant.int 1 %2178 = 
torch.aten.slice.Tensor %1915, %int0_2185, %int0_2186, %int9223372036854775807_2187, %int1_2188 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_2189 = torch.constant.int 1 %int0_2190 = torch.constant.int 0 %int1_2191 = torch.constant.int 1 %2179 = torch.aten.slice_scatter %2178, %2177, %int1_2189, %int0_2190, %2175, %int1_2191 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_2192 = torch.constant.int 0 %int0_2193 = torch.constant.int 0 %int9223372036854775807_2194 = torch.constant.int 9223372036854775807 %int1_2195 = torch.constant.int 1 %2180 = torch.aten.slice_scatter %1915, %2179, %int0_2192, %int0_2193, %int9223372036854775807_2194, %int1_2195 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_2196 = torch.constant.int 1 %int1_2197 = torch.constant.int 1 %2181 = torch.aten.add.Scalar %2157, %int1_2196, %int1_2197 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_2198 = torch.constant.int 4 %2182 = torch.aten.mul.int %int4_2198, %655 : !torch.int, !torch.int -> !torch.int %2183 = torch.prim.ListConstruct %2182 : (!torch.int) -> !torch.list %2184 = torch.aten.view %2181, %2183 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int0_2199 = torch.constant.int 0 %2185 = torch.aten.index_select %2166, %int0_2199, %2184 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_2200 = torch.constant.int 4 %int16_2201 = torch.constant.int 16 %int32_2202 = torch.constant.int 32 %int100_2203 = torch.constant.int 100 %2186 = torch.prim.ListConstruct %int4_2200, %655, %int16_2201, %int32_2202, %int100_2203 : (!torch.int, !torch.int, !torch.int, 
!torch.int, !torch.int) -> !torch.list %2187 = torch.aten.view %2185, %2186 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_2204 = torch.constant.int 1 %2188 = torch.aten.size.int %2187, %int1_2204 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_2205 = torch.constant.int 16 %2189 = torch.aten.mul.int %2188, %int16_2205 : !torch.int, !torch.int -> !torch.int %int4_2206 = torch.constant.int 4 %int32_2207 = torch.constant.int 32 %int100_2208 = torch.constant.int 100 %2190 = torch.prim.ListConstruct %int4_2206, %2189, %int32_2207, %int100_2208 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2191 = torch.aten.view %2187, %2190 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_2209 = torch.constant.int 0 %int0_2210 = torch.constant.int 0 %int9223372036854775807_2211 = torch.constant.int 9223372036854775807 %int1_2212 = torch.constant.int 1 %2192 = torch.aten.slice.Tensor %1932, %int0_2209, %int0_2210, %int9223372036854775807_2211, %int1_2212 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_2213 = torch.constant.int 1 %int0_2214 = torch.constant.int 0 %int1_2215 = torch.constant.int 1 %2193 = torch.aten.slice.Tensor %2192, %int1_2213, %int0_2214, %2175, %int1_2215 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_2216 = torch.constant.bool false %2194 = torch.aten.copy %2193, %2191, %false_2216 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_2217 = torch.constant.int 0 %int0_2218 = torch.constant.int 0 %int9223372036854775807_2219 = torch.constant.int 9223372036854775807 %int1_2220 = torch.constant.int 1 %2195 = torch.aten.slice.Tensor %1932, %int0_2217, %int0_2218, %int9223372036854775807_2219, %int1_2220 : 
!torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_2221 = torch.constant.int 1 %int0_2222 = torch.constant.int 0 %int1_2223 = torch.constant.int 1 %2196 = torch.aten.slice_scatter %2195, %2194, %int1_2221, %int0_2222, %2175, %int1_2223 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_2224 = torch.constant.int 0 %int0_2225 = torch.constant.int 0 %int9223372036854775807_2226 = torch.constant.int 9223372036854775807 %int1_2227 = torch.constant.int 1 %2197 = torch.aten.slice_scatter %1932, %2196, %int0_2224, %int0_2225, %int9223372036854775807_2226, %int1_2227 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_2228 = torch.constant.int 0 %int0_2229 = torch.constant.int 0 %int9223372036854775807_2230 = torch.constant.int 9223372036854775807 %int1_2231 = torch.constant.int 1 %2198 = torch.aten.slice.Tensor %671, %int0_2228, %int0_2229, %int9223372036854775807_2230, %int1_2231 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_2232 = torch.constant.int 1 %int0_2233 = torch.constant.int 0 %int1_2234 = torch.constant.int 1 %2199 = torch.aten.slice.Tensor %2198, %int1_2232, %int0_2233, %2175, %int1_2234 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int0_2235 = torch.constant.int 0 %int0_2236 = torch.constant.int 0 %int9223372036854775807_2237 = torch.constant.int 9223372036854775807 %int1_2238 = torch.constant.int 1 %2200 = torch.aten.slice.Tensor %673, %int0_2235, %int0_2236, %int9223372036854775807_2237, %int1_2238 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> 
!torch.vtensor<[4,2048,32,100],f32> %int1_2239 = torch.constant.int 1 %int0_2240 = torch.constant.int 0 %int1_2241 = torch.constant.int 1 %2201 = torch.aten.slice.Tensor %2200, %int1_2239, %int0_2240, %2175, %int1_2241 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_2242 = torch.constant.int 1 %int2_2243 = torch.constant.int 2 %2202 = torch.aten.transpose.int %2038, %int1_2242, %int2_2243 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,1,100],f32> %int4_2244 = torch.constant.int 4 %int32_2245 = torch.constant.int 32 %int1_2246 = torch.constant.int 1 %int100_2247 = torch.constant.int 100 %2203 = torch.prim.ListConstruct %int4_2244, %int32_2245, %int1_2246, %int100_2247 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_2248 = torch.constant.bool false %2204 = torch.aten.expand %2202, %2203, %false_2248 : !torch.vtensor<[4,32,1,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,100],f32> %int128_2249 = torch.constant.int 128 %int1_2250 = torch.constant.int 1 %int100_2251 = torch.constant.int 100 %2205 = torch.prim.ListConstruct %int128_2249, %int1_2250, %int100_2251 : (!torch.int, !torch.int, !torch.int) -> !torch.list %2206 = torch.aten.view %2204, %2205 : !torch.vtensor<[4,32,1,100],f32>, !torch.list -> !torch.vtensor<[128,1,100],f32> %int0_2252 = torch.constant.int 0 %int0_2253 = torch.constant.int 0 %int9223372036854775807_2254 = torch.constant.int 9223372036854775807 %int1_2255 = torch.constant.int 1 %2207 = torch.aten.slice.Tensor %2180, %int0_2252, %int0_2253, %int9223372036854775807_2254, %int1_2255 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_2256 = torch.constant.int 1 %int0_2257 = torch.constant.int 0 %int1_2258 = torch.constant.int 1 %2208 = torch.aten.slice.Tensor %2207, %int1_2256, %int0_2257, %2175, %int1_2258 : 
!torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_2259 = torch.constant.int 1 %int2_2260 = torch.constant.int 2 %2209 = torch.aten.transpose.int %2208, %int1_2259, %int2_2260 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int2_2261 = torch.constant.int 2 %int3_2262 = torch.constant.int 3 %2210 = torch.aten.transpose.int %2209, %int2_2261, %int3_2262 : !torch.vtensor<[4,32,?,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int1_2263 = torch.constant.int 1 %2211 = torch.aten.size.int %2199, %int1_2263 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_2264 = torch.constant.int 4 %int32_2265 = torch.constant.int 32 %int100_2266 = torch.constant.int 100 %2212 = torch.prim.ListConstruct %int4_2264, %int32_2265, %int100_2266, %2211 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_2267 = torch.constant.bool false %2213 = torch.aten.expand %2210, %2212, %false_2267 : !torch.vtensor<[4,32,100,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,100,?],f32> %int0_2268 = torch.constant.int 0 %2214 = torch.aten.clone %2213, %int0_2268 : !torch.vtensor<[4,32,100,?],f32>, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int128_2269 = torch.constant.int 128 %int100_2270 = torch.constant.int 100 %2215 = torch.prim.ListConstruct %int128_2269, %int100_2270, %2211 : (!torch.int, !torch.int, !torch.int) -> !torch.list %2216 = torch.aten._unsafe_view %2214, %2215 : !torch.vtensor<[4,32,100,?],f32>, !torch.list -> !torch.vtensor<[128,100,?],f32> %2217 = torch.aten.bmm %2206, %2216 : !torch.vtensor<[128,1,100],f32>, !torch.vtensor<[128,100,?],f32> -> !torch.vtensor<[128,1,?],f32> %int4_2271 = torch.constant.int 4 %int32_2272 = torch.constant.int 32 %int1_2273 = torch.constant.int 1 %2218 = torch.prim.ListConstruct %int4_2271, %int32_2272, %int1_2273, %2211 : (!torch.int, !torch.int, !torch.int, 
!torch.int) -> !torch.list %2219 = torch.aten.view %2217, %2218 : !torch.vtensor<[128,1,?],f32>, !torch.list -> !torch.vtensor<[4,32,1,?],f32> %float1.000000e01_2274 = torch.constant.float 1.000000e+01 %2220 = torch.aten.div.Scalar %2219, %float1.000000e01_2274 : !torch.vtensor<[4,32,1,?],f32>, !torch.float -> !torch.vtensor<[4,32,1,?],f32> %int1_2275 = torch.constant.int 1 %2221 = torch.aten.add.Tensor %2220, %895, %int1_2275 : !torch.vtensor<[4,32,1,?],f32>, !torch.vtensor<[4,1,1,?],f32>, !torch.int -> !torch.vtensor<[4,32,1,?],f32> %int-1_2276 = torch.constant.int -1 %false_2277 = torch.constant.bool false %2222 = torch.aten._softmax %2221, %int-1_2276, %false_2277 : !torch.vtensor<[4,32,1,?],f32>, !torch.int, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int4_2278 = torch.constant.int 4 %int32_2279 = torch.constant.int 32 %int1_2280 = torch.constant.int 1 %2223 = torch.prim.ListConstruct %int4_2278, %int32_2279, %int1_2280, %2211 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_2281 = torch.constant.bool false %2224 = torch.aten.expand %2222, %2223, %false_2281 : !torch.vtensor<[4,32,1,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int128_2282 = torch.constant.int 128 %int1_2283 = torch.constant.int 1 %2225 = torch.prim.ListConstruct %int128_2282, %int1_2283, %2211 : (!torch.int, !torch.int, !torch.int) -> !torch.list %2226 = torch.aten.view %2224, %2225 : !torch.vtensor<[4,32,1,?],f32>, !torch.list -> !torch.vtensor<[128,1,?],f32> %int0_2284 = torch.constant.int 0 %int0_2285 = torch.constant.int 0 %int9223372036854775807_2286 = torch.constant.int 9223372036854775807 %int1_2287 = torch.constant.int 1 %2227 = torch.aten.slice.Tensor %2197, %int0_2284, %int0_2285, %int9223372036854775807_2286, %int1_2287 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_2288 = torch.constant.int 1 %int0_2289 = torch.constant.int 0 %int1_2290 = 
torch.constant.int 1 %2228 = torch.aten.slice.Tensor %2227, %int1_2288, %int0_2289, %2175, %int1_2290 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_2291 = torch.constant.int 1 %int2_2292 = torch.constant.int 2 %2229 = torch.aten.transpose.int %2228, %int1_2291, %int2_2292 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int1_2293 = torch.constant.int 1 %2230 = torch.aten.size.int %2201, %int1_2293 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_2294 = torch.constant.int 4 %int32_2295 = torch.constant.int 32 %int100_2296 = torch.constant.int 100 %2231 = torch.prim.ListConstruct %int4_2294, %int32_2295, %2230, %int100_2296 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_2297 = torch.constant.bool false %2232 = torch.aten.expand %2229, %2231, %false_2297 : !torch.vtensor<[4,32,?,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,?,100],f32> %int0_2298 = torch.constant.int 0 %2233 = torch.aten.clone %2232, %int0_2298 : !torch.vtensor<[4,32,?,100],f32>, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int128_2299 = torch.constant.int 128 %int100_2300 = torch.constant.int 100 %2234 = torch.prim.ListConstruct %int128_2299, %2230, %int100_2300 : (!torch.int, !torch.int, !torch.int) -> !torch.list %2235 = torch.aten._unsafe_view %2233, %2234 : !torch.vtensor<[4,32,?,100],f32>, !torch.list -> !torch.vtensor<[128,?,100],f32> %2236 = torch.aten.bmm %2226, %2235 : !torch.vtensor<[128,1,?],f32>, !torch.vtensor<[128,?,100],f32> -> !torch.vtensor<[128,1,100],f32> %int4_2301 = torch.constant.int 4 %int32_2302 = torch.constant.int 32 %int1_2303 = torch.constant.int 1 %int100_2304 = torch.constant.int 100 %2237 = torch.prim.ListConstruct %int4_2301, %int32_2302, %int1_2303, %int100_2304 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2238 = torch.aten.view %2236, %2237 : 
!torch.vtensor<[128,1,100],f32>, !torch.list -> !torch.vtensor<[4,32,1,100],f32> %int1_2305 = torch.constant.int 1 %int2_2306 = torch.constant.int 2 %2239 = torch.aten.transpose.int %2238, %int1_2305, %int2_2306 : !torch.vtensor<[4,32,1,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,1,32,100],f32> %int4_2307 = torch.constant.int 4 %int1_2308 = torch.constant.int 1 %int-1_2309 = torch.constant.int -1 %2240 = torch.prim.ListConstruct %int4_2307, %int1_2308, %int-1_2309 : (!torch.int, !torch.int, !torch.int) -> !torch.list %2241 = torch.aten.view %2239, %2240 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,3200],f32> %2242 = torch_c.to_builtin_tensor %2241 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_2310 = tensor.cast %2242 : tensor<4x1x3200xf32> to tensor %2243 = torch_c.to_builtin_tensor %51 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %2244 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_2310, %2243) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_2311 = tensor.cast %2244 : tensor to tensor<4x1x3200xf32> %2245 = torch_c.from_builtin_tensor %cast_2311 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int1_2312 = torch.constant.int 1 %2246 = torch.aten.add.Tensor %2003, %2245, %int1_2312 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_2313 = torch.constant.int 2 %2247 = torch.aten.pow.Tensor_Scalar %2246, %int2_2313 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_2314 = torch.constant.int -1 %2248 = torch.prim.ListConstruct %int-1_2314 : (!torch.int) -> !torch.list %true_2315 = torch.constant.bool true %none_2316 = torch.constant.none %2249 = torch.aten.mean.dim %2247, %2248, %true_2315, %none_2316 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_2317 = torch.constant.float 9.9999999747524271E-7 %int1_2318 = 
torch.constant.int 1 %2250 = torch.aten.add.Scalar %2249, %float9.999990e-07_2317, %int1_2318 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %2251 = torch.aten.rsqrt %2250 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %2252 = torch.aten.mul.Tensor %2246, %2251 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %2253 = torch.aten.mul.Tensor %2252, %52 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %2254 = torch_c.to_builtin_tensor %2253 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_2319 = tensor.cast %2254 : tensor<4x1x3200xf32> to tensor %2255 = torch_c.to_builtin_tensor %53 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %2256 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_2319, %2255) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_2320 = tensor.cast %2256 : tensor to tensor<4x1x8640xf32> %2257 = torch_c.from_builtin_tensor %cast_2320 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %2258 = torch.aten.silu %2257 : !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32> %2259 = torch_c.to_builtin_tensor %2253 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_2321 = tensor.cast %2259 : tensor<4x1x3200xf32> to tensor %2260 = torch_c.to_builtin_tensor %54 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %2261 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_2321, %2260) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_2322 = tensor.cast %2261 : tensor to tensor<4x1x8640xf32> %2262 = torch_c.from_builtin_tensor %cast_2322 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %2263 = torch.aten.mul.Tensor %2258, %2262 : !torch.vtensor<[4,1,8640],f32>, !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32> %2264 = torch_c.to_builtin_tensor %2263 : !torch.vtensor<[4,1,8640],f32> -> tensor<4x1x8640xf32> %cast_2323 = 
tensor.cast %2264 : tensor<4x1x8640xf32> to tensor %2265 = torch_c.to_builtin_tensor %55 : !torch.vtensor<[3200,8640],f16> -> tensor<3200x8640xf16> %2266 = util.call @sharktank_mmtfp_3d_3200_8640_f32f16f32(%cast_2323, %2265) : (tensor, tensor<3200x8640xf16>) -> tensor %cast_2324 = tensor.cast %2266 : tensor to tensor<4x1x3200xf32> %2267 = torch_c.from_builtin_tensor %cast_2324 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int1_2325 = torch.constant.int 1 %2268 = torch.aten.add.Tensor %2246, %2267, %int1_2325 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_2326 = torch.constant.int 2 %2269 = torch.aten.pow.Tensor_Scalar %2268, %int2_2326 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_2327 = torch.constant.int -1 %2270 = torch.prim.ListConstruct %int-1_2327 : (!torch.int) -> !torch.list %true_2328 = torch.constant.bool true %none_2329 = torch.constant.none %2271 = torch.aten.mean.dim %2269, %2270, %true_2328, %none_2329 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_2330 = torch.constant.float 9.9999999747524271E-7 %int1_2331 = torch.constant.int 1 %2272 = torch.aten.add.Scalar %2271, %float9.999990e-07_2330, %int1_2331 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %2273 = torch.aten.rsqrt %2272 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %2274 = torch.aten.mul.Tensor %2268, %2273 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %2275 = torch.aten.mul.Tensor %2274, %56 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %2276 = torch_c.to_builtin_tensor %2275 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_2332 = tensor.cast %2276 : tensor<4x1x3200xf32> to tensor %2277 = torch_c.to_builtin_tensor %57 : 
!torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %2278 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_2332, %2277) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_2333 = tensor.cast %2278 : tensor to tensor<4x1x3200xf32> %2279 = torch_c.from_builtin_tensor %cast_2333 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %2280 = torch_c.to_builtin_tensor %2275 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_2334 = tensor.cast %2280 : tensor<4x1x3200xf32> to tensor %2281 = torch_c.to_builtin_tensor %58 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %2282 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_2334, %2281) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_2335 = tensor.cast %2282 : tensor to tensor<4x1x3200xf32> %2283 = torch_c.from_builtin_tensor %cast_2335 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %2284 = torch_c.to_builtin_tensor %2275 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_2336 = tensor.cast %2284 : tensor<4x1x3200xf32> to tensor %2285 = torch_c.to_builtin_tensor %59 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %2286 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_2336, %2285) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_2337 = tensor.cast %2286 : tensor to tensor<4x1x3200xf32> %2287 = torch_c.from_builtin_tensor %cast_2337 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int4_2338 = torch.constant.int 4 %int1_2339 = torch.constant.int 1 %int32_2340 = torch.constant.int 32 %int100_2341 = torch.constant.int 100 %2288 = torch.prim.ListConstruct %int4_2338, %int1_2339, %int32_2340, %int100_2341 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2289 = torch.aten.view %2279, %2288 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_2342 = torch.constant.int 4 %int1_2343 = torch.constant.int 1 %int32_2344 = torch.constant.int 32 %int100_2345 = torch.constant.int 100 %2290 = 
torch.prim.ListConstruct %int4_2342, %int1_2343, %int32_2344, %int100_2345 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2291 = torch.aten.view %2283, %2290 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_2346 = torch.constant.int 4 %int1_2347 = torch.constant.int 1 %int32_2348 = torch.constant.int 32 %int100_2349 = torch.constant.int 100 %2292 = torch.prim.ListConstruct %int4_2346, %int1_2347, %int32_2348, %int100_2349 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2293 = torch.aten.view %2287, %2292 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_2350 = torch.constant.int 4 %int1_2351 = torch.constant.int 1 %int32_2352 = torch.constant.int 32 %int-1_2353 = torch.constant.int -1 %int2_2354 = torch.constant.int 2 %2294 = torch.prim.ListConstruct %int4_2350, %int1_2351, %int32_2352, %int-1_2353, %int2_2354 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2295 = torch.aten.view %2289, %2294 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %2296 = torch.aten.view_as_complex %2295 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %int4_2355 = torch.constant.int 4 %int1_2356 = torch.constant.int 1 %int32_2357 = torch.constant.int 32 %int-1_2358 = torch.constant.int -1 %int2_2359 = torch.constant.int 2 %2297 = torch.prim.ListConstruct %int4_2355, %int1_2356, %int32_2357, %int-1_2358, %int2_2359 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2298 = torch.aten.view %2291, %2297 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %2299 = torch.aten.view_as_complex %2298 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %2300 = torch.aten.mul.Tensor %2296, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %2301 
= torch.aten.view_as_real %2300 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_2360 = torch.constant.int 4 %int1_2361 = torch.constant.int 1 %int32_2362 = torch.constant.int 32 %int100_2363 = torch.constant.int 100 %2302 = torch.prim.ListConstruct %int4_2360, %int1_2361, %int32_2362, %int100_2363 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2303 = torch.aten.view %2301, %2302 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %2304 = torch.aten.mul.Tensor %2299, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %2305 = torch.aten.view_as_real %2304 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_2364 = torch.constant.int 4 %int1_2365 = torch.constant.int 1 %int32_2366 = torch.constant.int 32 %int100_2367 = torch.constant.int 100 %2306 = torch.prim.ListConstruct %int4_2364, %int1_2365, %int32_2366, %int100_2367 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2307 = torch.aten.view %2305, %2306 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int1_2368 = torch.constant.int 1 %int1_2369 = torch.constant.int 1 %2308 = torch.aten.add.Scalar %arg2, %int1_2368, %int1_2369 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[4],si64> %int0_2370 = torch.constant.int 0 %int0_2371 = torch.constant.int 0 %2309 = torch.aten.select.int %2308, %int0_2370, %int0_2371 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_2372 = torch.constant.int 0 %int0_2373 = torch.constant.int 0 %2310 = torch.aten.select.int %arg3, %int0_2372, %int0_2373 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_2374 = torch.constant.int 0 %int0_2375 = torch.constant.int 0 %int9223372036854775807_2376 = torch.constant.int 9223372036854775807 %int1_2377 = torch.constant.int 1 
%2311 = torch.aten.slice.Tensor %2310, %int0_2374, %int0_2375, %int9223372036854775807_2376, %int1_2377 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_2378 = torch.constant.int 16 %2312 = torch.aten.floor_divide.Scalar %2309, %int16_2378 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_2379 = torch.constant.int 0 %2313 = torch.aten.index_select %2311, %int0_2379, %2312 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_2380 = torch.constant.int 16 %2314 = torch.aten.remainder.Scalar %2309, %int16_2380 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_2381 = torch.constant.none %2315 = torch.aten.clone %334, %none_2381 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_2382 = torch.constant.none %2316 = torch.aten.clone %335, %none_2382 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_2383 = torch.constant.int 0 %2317 = torch.aten.unsqueeze %2314, %int0_2383 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_2384 = torch.constant.int 0 %int0_2385 = torch.constant.int 0 %2318 = torch.aten.select.int %2307, %int0_2384, %int0_2385 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_2386 = torch.constant.int 0 %int0_2387 = torch.constant.int 0 %2319 = torch.aten.select.int %2318, %int0_2386, %int0_2387 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %int-1_2388 = torch.constant.int -1 %int26_2389 = torch.constant.int 26 %int2_2390 = torch.constant.int 2 %int16_2391 = torch.constant.int 16 %int32_2392 = torch.constant.int 32 %int100_2393 = torch.constant.int 100 %2320 = torch.prim.ListConstruct %int-1_2388, %int26_2389, %int2_2390, %int16_2391, %int32_2392, %int100_2393 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2321 = 
torch.aten.view %2155, %2320 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %2322 = torch.prim.ListConstruct %2313, %2315, %2316, %2317 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_2394 = torch.constant.bool false %2323 = torch.aten.index_put %2321, %2322, %2319, %false_2394 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_2395 = torch.constant.int 2662400 %2324 = torch.prim.ListConstruct %731, %int2662400_2395 : (!torch.int, !torch.int) -> !torch.list %2325 = torch.aten.view %2323, %2324 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_2396 = torch.constant.int -1 %int26_2397 = torch.constant.int 26 %int2_2398 = torch.constant.int 2 %int16_2399 = torch.constant.int 16 %int32_2400 = torch.constant.int 32 %int100_2401 = torch.constant.int 100 %2326 = torch.prim.ListConstruct %int-1_2396, %int26_2397, %int2_2398, %int16_2399, %int32_2400, %int100_2401 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2327 = torch.aten.view %2325, %2326 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_2402 = torch.constant.none %2328 = torch.aten.clone %336, %none_2402 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_2403 = torch.constant.none %2329 = torch.aten.clone %337, %none_2403 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_2404 = torch.constant.int 0 %2330 = torch.aten.unsqueeze %2314, %int0_2404 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_2405 = torch.constant.int 0 %int0_2406 = torch.constant.int 0 %2331 = torch.aten.select.int %2293, %int0_2405, %int0_2406 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> 
!torch.vtensor<[1,32,100],f32> %int0_2407 = torch.constant.int 0 %int0_2408 = torch.constant.int 0 %2332 = torch.aten.select.int %2331, %int0_2407, %int0_2408 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %2333 = torch.prim.ListConstruct %2313, %2328, %2329, %2330 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_2409 = torch.constant.bool false %2334 = torch.aten.index_put %2327, %2333, %2332, %false_2409 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_2410 = torch.constant.int 2662400 %2335 = torch.prim.ListConstruct %731, %int2662400_2410 : (!torch.int, !torch.int) -> !torch.list %2336 = torch.aten.view %2334, %2335 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_2411 = torch.constant.int -1 %int26_2412 = torch.constant.int 26 %int2_2413 = torch.constant.int 2 %int16_2414 = torch.constant.int 16 %int32_2415 = torch.constant.int 32 %int100_2416 = torch.constant.int 100 %2337 = torch.prim.ListConstruct %int-1_2411, %int26_2412, %int2_2413, %int16_2414, %int32_2415, %int100_2416 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2338 = torch.aten.view %2336, %2337 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_2417 = torch.constant.int 0 %int1_2418 = torch.constant.int 1 %2339 = torch.aten.select.int %2308, %int0_2417, %int1_2418 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_2419 = torch.constant.int 0 %int1_2420 = torch.constant.int 1 %2340 = torch.aten.select.int %arg3, %int0_2419, %int1_2420 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_2421 = torch.constant.int 0 %int0_2422 = torch.constant.int 0 %int9223372036854775807_2423 = 
torch.constant.int 9223372036854775807 %int1_2424 = torch.constant.int 1 %2341 = torch.aten.slice.Tensor %2340, %int0_2421, %int0_2422, %int9223372036854775807_2423, %int1_2424 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_2425 = torch.constant.int 16 %2342 = torch.aten.floor_divide.Scalar %2339, %int16_2425 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_2426 = torch.constant.int 0 %2343 = torch.aten.index_select %2341, %int0_2426, %2342 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_2427 = torch.constant.int 16 %2344 = torch.aten.remainder.Scalar %2339, %int16_2427 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_2428 = torch.constant.none %2345 = torch.aten.clone %338, %none_2428 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_2429 = torch.constant.none %2346 = torch.aten.clone %339, %none_2429 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_2430 = torch.constant.int 0 %2347 = torch.aten.unsqueeze %2344, %int0_2430 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_2431 = torch.constant.int 0 %int1_2432 = torch.constant.int 1 %2348 = torch.aten.select.int %2307, %int0_2431, %int1_2432 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_2433 = torch.constant.int 0 %int0_2434 = torch.constant.int 0 %2349 = torch.aten.select.int %2348, %int0_2433, %int0_2434 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %2350 = torch.prim.ListConstruct %2343, %2345, %2346, %2347 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_2435 = torch.constant.bool false %2351 = torch.aten.index_put %2338, %2350, %2349, %false_2435 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, 
!torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_2436 = torch.constant.int 2662400 %2352 = torch.prim.ListConstruct %731, %int2662400_2436 : (!torch.int, !torch.int) -> !torch.list %2353 = torch.aten.view %2351, %2352 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_2437 = torch.constant.int -1 %int26_2438 = torch.constant.int 26 %int2_2439 = torch.constant.int 2 %int16_2440 = torch.constant.int 16 %int32_2441 = torch.constant.int 32 %int100_2442 = torch.constant.int 100 %2354 = torch.prim.ListConstruct %int-1_2437, %int26_2438, %int2_2439, %int16_2440, %int32_2441, %int100_2442 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2355 = torch.aten.view %2353, %2354 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_2443 = torch.constant.none %2356 = torch.aten.clone %340, %none_2443 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_2444 = torch.constant.none %2357 = torch.aten.clone %341, %none_2444 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_2445 = torch.constant.int 0 %2358 = torch.aten.unsqueeze %2344, %int0_2445 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_2446 = torch.constant.int 0 %int1_2447 = torch.constant.int 1 %2359 = torch.aten.select.int %2293, %int0_2446, %int1_2447 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_2448 = torch.constant.int 0 %int0_2449 = torch.constant.int 0 %2360 = torch.aten.select.int %2359, %int0_2448, %int0_2449 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %2361 = torch.prim.ListConstruct %2343, %2356, %2357, %2358 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_2450 = torch.constant.bool false %2362 = 
torch.aten.index_put %2355, %2361, %2360, %false_2450 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_2451 = torch.constant.int 2662400 %2363 = torch.prim.ListConstruct %731, %int2662400_2451 : (!torch.int, !torch.int) -> !torch.list %2364 = torch.aten.view %2362, %2363 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_2452 = torch.constant.int -1 %int26_2453 = torch.constant.int 26 %int2_2454 = torch.constant.int 2 %int16_2455 = torch.constant.int 16 %int32_2456 = torch.constant.int 32 %int100_2457 = torch.constant.int 100 %2365 = torch.prim.ListConstruct %int-1_2452, %int26_2453, %int2_2454, %int16_2455, %int32_2456, %int100_2457 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2366 = torch.aten.view %2364, %2365 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_2458 = torch.constant.int 0 %int2_2459 = torch.constant.int 2 %2367 = torch.aten.select.int %2308, %int0_2458, %int2_2459 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_2460 = torch.constant.int 0 %int2_2461 = torch.constant.int 2 %2368 = torch.aten.select.int %arg3, %int0_2460, %int2_2461 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_2462 = torch.constant.int 0 %int0_2463 = torch.constant.int 0 %int9223372036854775807_2464 = torch.constant.int 9223372036854775807 %int1_2465 = torch.constant.int 1 %2369 = torch.aten.slice.Tensor %2368, %int0_2462, %int0_2463, %int9223372036854775807_2464, %int1_2465 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_2466 = torch.constant.int 16 %2370 = torch.aten.floor_divide.Scalar %2367, %int16_2466 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_2467 = torch.constant.int 0 %2371 
= torch.aten.index_select %2369, %int0_2467, %2370 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_2468 = torch.constant.int 16 %2372 = torch.aten.remainder.Scalar %2367, %int16_2468 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_2469 = torch.constant.none %2373 = torch.aten.clone %342, %none_2469 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_2470 = torch.constant.none %2374 = torch.aten.clone %343, %none_2470 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_2471 = torch.constant.int 0 %2375 = torch.aten.unsqueeze %2372, %int0_2471 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_2472 = torch.constant.int 0 %int2_2473 = torch.constant.int 2 %2376 = torch.aten.select.int %2307, %int0_2472, %int2_2473 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_2474 = torch.constant.int 0 %int0_2475 = torch.constant.int 0 %2377 = torch.aten.select.int %2376, %int0_2474, %int0_2475 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %2378 = torch.prim.ListConstruct %2371, %2373, %2374, %2375 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_2476 = torch.constant.bool false %2379 = torch.aten.index_put %2366, %2378, %2377, %false_2476 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_2477 = torch.constant.int 2662400 %2380 = torch.prim.ListConstruct %731, %int2662400_2477 : (!torch.int, !torch.int) -> !torch.list %2381 = torch.aten.view %2379, %2380 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_2478 = torch.constant.int -1 %int26_2479 = torch.constant.int 26 %int2_2480 = torch.constant.int 2 %int16_2481 = 
torch.constant.int 16 %int32_2482 = torch.constant.int 32 %int100_2483 = torch.constant.int 100 %2382 = torch.prim.ListConstruct %int-1_2478, %int26_2479, %int2_2480, %int16_2481, %int32_2482, %int100_2483 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2383 = torch.aten.view %2381, %2382 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_2484 = torch.constant.none %2384 = torch.aten.clone %344, %none_2484 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_2485 = torch.constant.none %2385 = torch.aten.clone %345, %none_2485 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_2486 = torch.constant.int 0 %2386 = torch.aten.unsqueeze %2372, %int0_2486 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_2487 = torch.constant.int 0 %int2_2488 = torch.constant.int 2 %2387 = torch.aten.select.int %2293, %int0_2487, %int2_2488 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_2489 = torch.constant.int 0 %int0_2490 = torch.constant.int 0 %2388 = torch.aten.select.int %2387, %int0_2489, %int0_2490 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %2389 = torch.prim.ListConstruct %2371, %2384, %2385, %2386 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_2491 = torch.constant.bool false %2390 = torch.aten.index_put %2383, %2389, %2388, %false_2491 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_2492 = torch.constant.int 2662400 %2391 = torch.prim.ListConstruct %731, %int2662400_2492 : (!torch.int, !torch.int) -> !torch.list %2392 = torch.aten.view %2390, %2391 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_2493 
= torch.constant.int -1 %int26_2494 = torch.constant.int 26 %int2_2495 = torch.constant.int 2 %int16_2496 = torch.constant.int 16 %int32_2497 = torch.constant.int 32 %int100_2498 = torch.constant.int 100 %2393 = torch.prim.ListConstruct %int-1_2493, %int26_2494, %int2_2495, %int16_2496, %int32_2497, %int100_2498 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2394 = torch.aten.view %2392, %2393 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_2499 = torch.constant.int 0 %int3_2500 = torch.constant.int 3 %2395 = torch.aten.select.int %2308, %int0_2499, %int3_2500 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_2501 = torch.constant.int 0 %int3_2502 = torch.constant.int 3 %2396 = torch.aten.select.int %arg3, %int0_2501, %int3_2502 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_2503 = torch.constant.int 0 %int0_2504 = torch.constant.int 0 %int9223372036854775807_2505 = torch.constant.int 9223372036854775807 %int1_2506 = torch.constant.int 1 %2397 = torch.aten.slice.Tensor %2396, %int0_2503, %int0_2504, %int9223372036854775807_2505, %int1_2506 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_2507 = torch.constant.int 16 %2398 = torch.aten.floor_divide.Scalar %2395, %int16_2507 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_2508 = torch.constant.int 0 %2399 = torch.aten.index_select %2397, %int0_2508, %2398 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_2509 = torch.constant.int 16 %2400 = torch.aten.remainder.Scalar %2395, %int16_2509 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_2510 = torch.constant.none %2401 = torch.aten.clone %346, %none_2510 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_2511 = torch.constant.none 
%2402 = torch.aten.clone %347, %none_2511 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_2512 = torch.constant.int 0 %2403 = torch.aten.unsqueeze %2400, %int0_2512 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_2513 = torch.constant.int 0 %int3_2514 = torch.constant.int 3 %2404 = torch.aten.select.int %2307, %int0_2513, %int3_2514 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_2515 = torch.constant.int 0 %int0_2516 = torch.constant.int 0 %2405 = torch.aten.select.int %2404, %int0_2515, %int0_2516 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %2406 = torch.prim.ListConstruct %2399, %2401, %2402, %2403 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_2517 = torch.constant.bool false %2407 = torch.aten.index_put %2394, %2406, %2405, %false_2517 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_2518 = torch.constant.int 2662400 %2408 = torch.prim.ListConstruct %731, %int2662400_2518 : (!torch.int, !torch.int) -> !torch.list %2409 = torch.aten.view %2407, %2408 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_2519 = torch.constant.int -1 %int26_2520 = torch.constant.int 26 %int2_2521 = torch.constant.int 2 %int16_2522 = torch.constant.int 16 %int32_2523 = torch.constant.int 32 %int100_2524 = torch.constant.int 100 %2410 = torch.prim.ListConstruct %int-1_2519, %int26_2520, %int2_2521, %int16_2522, %int32_2523, %int100_2524 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2411 = torch.aten.view %2409, %2410 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_2525 = torch.constant.none %2412 = torch.aten.clone %348, 
%none_2525 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_2526 = torch.constant.none %2413 = torch.aten.clone %349, %none_2526 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_2527 = torch.constant.int 0 %2414 = torch.aten.unsqueeze %2400, %int0_2527 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_2528 = torch.constant.int 0 %int3_2529 = torch.constant.int 3 %2415 = torch.aten.select.int %2293, %int0_2528, %int3_2529 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_2530 = torch.constant.int 0 %int0_2531 = torch.constant.int 0 %2416 = torch.aten.select.int %2415, %int0_2530, %int0_2531 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %2417 = torch.prim.ListConstruct %2399, %2412, %2413, %2414 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_2532 = torch.constant.bool false %2418 = torch.aten.index_put %2411, %2417, %2416, %false_2532 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_2533 = torch.constant.int 2662400 %2419 = torch.prim.ListConstruct %731, %int2662400_2533 : (!torch.int, !torch.int) -> !torch.list %2420 = torch.aten.view %2418, %2419 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int52_2534 = torch.constant.int 52 %2421 = torch.aten.mul.Scalar %arg3, %int52_2534 : !torch.vtensor<[4,?],si64>, !torch.int -> !torch.vtensor<[4,?],si64> %int12 = torch.constant.int 12 %int1_2535 = torch.constant.int 1 %2422 = torch.aten.add.Scalar %2421, %int12, %int1_2535 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_2536 = torch.constant.int 4 %2423 = torch.aten.mul.int %int4_2536, %655 : !torch.int, !torch.int -> !torch.int %2424 = 
torch.prim.ListConstruct %2423 : (!torch.int) -> !torch.list %2425 = torch.aten.view %2422, %2424 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int-1_2537 = torch.constant.int -1 %int26_2538 = torch.constant.int 26 %int2_2539 = torch.constant.int 2 %int16_2540 = torch.constant.int 16 %int32_2541 = torch.constant.int 32 %int100_2542 = torch.constant.int 100 %2426 = torch.prim.ListConstruct %int-1_2537, %int26_2538, %int2_2539, %int16_2540, %int32_2541, %int100_2542 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2427 = torch.aten.view %2420, %2426 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int26_2543 = torch.constant.int 26 %2428 = torch.aten.mul.int %731, %int26_2543 : !torch.int, !torch.int -> !torch.int %int2_2544 = torch.constant.int 2 %2429 = torch.aten.mul.int %2428, %int2_2544 : !torch.int, !torch.int -> !torch.int %int16_2545 = torch.constant.int 16 %int32_2546 = torch.constant.int 32 %int100_2547 = torch.constant.int 100 %2430 = torch.prim.ListConstruct %2429, %int16_2545, %int32_2546, %int100_2547 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2431 = torch.aten.view %2427, %2430 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,16,32,100],f32> %int0_2548 = torch.constant.int 0 %2432 = torch.aten.index_select %2431, %int0_2548, %2425 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_2549 = torch.constant.int 4 %int16_2550 = torch.constant.int 16 %int32_2551 = torch.constant.int 32 %int100_2552 = torch.constant.int 100 %2433 = torch.prim.ListConstruct %int4_2549, %655, %int16_2550, %int32_2551, %int100_2552 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2434 = torch.aten.view %2432, %2433 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_2553 = 
torch.constant.int 1 %2435 = torch.aten.size.int %2434, %int1_2553 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_2554 = torch.constant.int 16 %2436 = torch.aten.mul.int %2435, %int16_2554 : !torch.int, !torch.int -> !torch.int %int4_2555 = torch.constant.int 4 %int32_2556 = torch.constant.int 32 %int100_2557 = torch.constant.int 100 %2437 = torch.prim.ListConstruct %int4_2555, %2436, %int32_2556, %int100_2557 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2438 = torch.aten.view %2434, %2437 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_2558 = torch.constant.int 0 %int0_2559 = torch.constant.int 0 %int9223372036854775807_2560 = torch.constant.int 9223372036854775807 %int1_2561 = torch.constant.int 1 %2439 = torch.aten.slice.Tensor %2180, %int0_2558, %int0_2559, %int9223372036854775807_2560, %int1_2561 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int16_2562 = torch.constant.int 16 %2440 = torch.aten.mul.int %655, %int16_2562 : !torch.int, !torch.int -> !torch.int %int1_2563 = torch.constant.int 1 %int0_2564 = torch.constant.int 0 %int1_2565 = torch.constant.int 1 %2441 = torch.aten.slice.Tensor %2439, %int1_2563, %int0_2564, %2440, %int1_2565 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_2566 = torch.constant.bool false %2442 = torch.aten.copy %2441, %2438, %false_2566 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_2567 = torch.constant.int 0 %int0_2568 = torch.constant.int 0 %int9223372036854775807_2569 = torch.constant.int 9223372036854775807 %int1_2570 = torch.constant.int 1 %2443 = torch.aten.slice.Tensor %2180, %int0_2567, %int0_2568, %int9223372036854775807_2569, %int1_2570 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, 
!torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_2571 = torch.constant.int 1 %int0_2572 = torch.constant.int 0 %int1_2573 = torch.constant.int 1 %2444 = torch.aten.slice_scatter %2443, %2442, %int1_2571, %int0_2572, %2440, %int1_2573 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_2574 = torch.constant.int 0 %int0_2575 = torch.constant.int 0 %int9223372036854775807_2576 = torch.constant.int 9223372036854775807 %int1_2577 = torch.constant.int 1 %2445 = torch.aten.slice_scatter %2180, %2444, %int0_2574, %int0_2575, %int9223372036854775807_2576, %int1_2577 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_2578 = torch.constant.int 1 %int1_2579 = torch.constant.int 1 %2446 = torch.aten.add.Scalar %2422, %int1_2578, %int1_2579 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_2580 = torch.constant.int 4 %2447 = torch.aten.mul.int %int4_2580, %655 : !torch.int, !torch.int -> !torch.int %2448 = torch.prim.ListConstruct %2447 : (!torch.int) -> !torch.list %2449 = torch.aten.view %2446, %2448 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int0_2581 = torch.constant.int 0 %2450 = torch.aten.index_select %2431, %int0_2581, %2449 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_2582 = torch.constant.int 4 %int16_2583 = torch.constant.int 16 %int32_2584 = torch.constant.int 32 %int100_2585 = torch.constant.int 100 %2451 = torch.prim.ListConstruct %int4_2582, %655, %int16_2583, %int32_2584, %int100_2585 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2452 = torch.aten.view %2450, %2451 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> 
!torch.vtensor<[4,?,16,32,100],f32> %int1_2586 = torch.constant.int 1 %2453 = torch.aten.size.int %2452, %int1_2586 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_2587 = torch.constant.int 16 %2454 = torch.aten.mul.int %2453, %int16_2587 : !torch.int, !torch.int -> !torch.int %int4_2588 = torch.constant.int 4 %int32_2589 = torch.constant.int 32 %int100_2590 = torch.constant.int 100 %2455 = torch.prim.ListConstruct %int4_2588, %2454, %int32_2589, %int100_2590 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2456 = torch.aten.view %2452, %2455 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_2591 = torch.constant.int 0 %int0_2592 = torch.constant.int 0 %int9223372036854775807_2593 = torch.constant.int 9223372036854775807 %int1_2594 = torch.constant.int 1 %2457 = torch.aten.slice.Tensor %2197, %int0_2591, %int0_2592, %int9223372036854775807_2593, %int1_2594 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_2595 = torch.constant.int 1 %int0_2596 = torch.constant.int 0 %int1_2597 = torch.constant.int 1 %2458 = torch.aten.slice.Tensor %2457, %int1_2595, %int0_2596, %2440, %int1_2597 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_2598 = torch.constant.bool false %2459 = torch.aten.copy %2458, %2456, %false_2598 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_2599 = torch.constant.int 0 %int0_2600 = torch.constant.int 0 %int9223372036854775807_2601 = torch.constant.int 9223372036854775807 %int1_2602 = torch.constant.int 1 %2460 = torch.aten.slice.Tensor %2197, %int0_2599, %int0_2600, %int9223372036854775807_2601, %int1_2602 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> 
%int1_2603 = torch.constant.int 1 %int0_2604 = torch.constant.int 0 %int1_2605 = torch.constant.int 1 %2461 = torch.aten.slice_scatter %2460, %2459, %int1_2603, %int0_2604, %2440, %int1_2605 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_2606 = torch.constant.int 0 %int0_2607 = torch.constant.int 0 %int9223372036854775807_2608 = torch.constant.int 9223372036854775807 %int1_2609 = torch.constant.int 1 %2462 = torch.aten.slice_scatter %2197, %2461, %int0_2606, %int0_2607, %int9223372036854775807_2608, %int1_2609 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_2610 = torch.constant.int 0 %int0_2611 = torch.constant.int 0 %int9223372036854775807_2612 = torch.constant.int 9223372036854775807 %int1_2613 = torch.constant.int 1 %2463 = torch.aten.slice.Tensor %671, %int0_2610, %int0_2611, %int9223372036854775807_2612, %int1_2613 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_2614 = torch.constant.int 1 %int0_2615 = torch.constant.int 0 %int1_2616 = torch.constant.int 1 %2464 = torch.aten.slice.Tensor %2463, %int1_2614, %int0_2615, %2440, %int1_2616 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int0_2617 = torch.constant.int 0 %int0_2618 = torch.constant.int 0 %int9223372036854775807_2619 = torch.constant.int 9223372036854775807 %int1_2620 = torch.constant.int 1 %2465 = torch.aten.slice.Tensor %673, %int0_2617, %int0_2618, %int9223372036854775807_2619, %int1_2620 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_2621 = torch.constant.int 1 %int0_2622 = torch.constant.int 0 %int1_2623 = 
torch.constant.int 1 %2466 = torch.aten.slice.Tensor %2465, %int1_2621, %int0_2622, %2440, %int1_2623 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_2624 = torch.constant.int 1 %int2_2625 = torch.constant.int 2 %2467 = torch.aten.transpose.int %2303, %int1_2624, %int2_2625 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,1,100],f32> %int4_2626 = torch.constant.int 4 %int32_2627 = torch.constant.int 32 %int1_2628 = torch.constant.int 1 %int100_2629 = torch.constant.int 100 %2468 = torch.prim.ListConstruct %int4_2626, %int32_2627, %int1_2628, %int100_2629 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_2630 = torch.constant.bool false %2469 = torch.aten.expand %2467, %2468, %false_2630 : !torch.vtensor<[4,32,1,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,100],f32> %int128_2631 = torch.constant.int 128 %int1_2632 = torch.constant.int 1 %int100_2633 = torch.constant.int 100 %2470 = torch.prim.ListConstruct %int128_2631, %int1_2632, %int100_2633 : (!torch.int, !torch.int, !torch.int) -> !torch.list %2471 = torch.aten.view %2469, %2470 : !torch.vtensor<[4,32,1,100],f32>, !torch.list -> !torch.vtensor<[128,1,100],f32> %int0_2634 = torch.constant.int 0 %int0_2635 = torch.constant.int 0 %int9223372036854775807_2636 = torch.constant.int 9223372036854775807 %int1_2637 = torch.constant.int 1 %2472 = torch.aten.slice.Tensor %2445, %int0_2634, %int0_2635, %int9223372036854775807_2636, %int1_2637 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_2638 = torch.constant.int 1 %int0_2639 = torch.constant.int 0 %int1_2640 = torch.constant.int 1 %2473 = torch.aten.slice.Tensor %2472, %int1_2638, %int0_2639, %2440, %int1_2640 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> 
%int1_2641 = torch.constant.int 1 %int2_2642 = torch.constant.int 2 %2474 = torch.aten.transpose.int %2473, %int1_2641, %int2_2642 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int2_2643 = torch.constant.int 2 %int3_2644 = torch.constant.int 3 %2475 = torch.aten.transpose.int %2474, %int2_2643, %int3_2644 : !torch.vtensor<[4,32,?,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int1_2645 = torch.constant.int 1 %2476 = torch.aten.size.int %2464, %int1_2645 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_2646 = torch.constant.int 4 %int32_2647 = torch.constant.int 32 %int100_2648 = torch.constant.int 100 %2477 = torch.prim.ListConstruct %int4_2646, %int32_2647, %int100_2648, %2476 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_2649 = torch.constant.bool false %2478 = torch.aten.expand %2475, %2477, %false_2649 : !torch.vtensor<[4,32,100,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,100,?],f32> %int0_2650 = torch.constant.int 0 %2479 = torch.aten.clone %2478, %int0_2650 : !torch.vtensor<[4,32,100,?],f32>, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int128_2651 = torch.constant.int 128 %int100_2652 = torch.constant.int 100 %2480 = torch.prim.ListConstruct %int128_2651, %int100_2652, %2476 : (!torch.int, !torch.int, !torch.int) -> !torch.list %2481 = torch.aten._unsafe_view %2479, %2480 : !torch.vtensor<[4,32,100,?],f32>, !torch.list -> !torch.vtensor<[128,100,?],f32> %2482 = torch.aten.bmm %2471, %2481 : !torch.vtensor<[128,1,100],f32>, !torch.vtensor<[128,100,?],f32> -> !torch.vtensor<[128,1,?],f32> %int4_2653 = torch.constant.int 4 %int32_2654 = torch.constant.int 32 %int1_2655 = torch.constant.int 1 %2483 = torch.prim.ListConstruct %int4_2653, %int32_2654, %int1_2655, %2476 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2484 = torch.aten.view %2482, %2483 : !torch.vtensor<[128,1,?],f32>, !torch.list -> 
!torch.vtensor<[4,32,1,?],f32> %float1.000000e01_2656 = torch.constant.float 1.000000e+01 %2485 = torch.aten.div.Scalar %2484, %float1.000000e01_2656 : !torch.vtensor<[4,32,1,?],f32>, !torch.float -> !torch.vtensor<[4,32,1,?],f32> %int1_2657 = torch.constant.int 1 %2486 = torch.aten.add.Tensor %2485, %895, %int1_2657 : !torch.vtensor<[4,32,1,?],f32>, !torch.vtensor<[4,1,1,?],f32>, !torch.int -> !torch.vtensor<[4,32,1,?],f32> %int-1_2658 = torch.constant.int -1 %false_2659 = torch.constant.bool false %2487 = torch.aten._softmax %2486, %int-1_2658, %false_2659 : !torch.vtensor<[4,32,1,?],f32>, !torch.int, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int4_2660 = torch.constant.int 4 %int32_2661 = torch.constant.int 32 %int1_2662 = torch.constant.int 1 %2488 = torch.prim.ListConstruct %int4_2660, %int32_2661, %int1_2662, %2476 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_2663 = torch.constant.bool false %2489 = torch.aten.expand %2487, %2488, %false_2663 : !torch.vtensor<[4,32,1,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int128_2664 = torch.constant.int 128 %int1_2665 = torch.constant.int 1 %2490 = torch.prim.ListConstruct %int128_2664, %int1_2665, %2476 : (!torch.int, !torch.int, !torch.int) -> !torch.list %2491 = torch.aten.view %2489, %2490 : !torch.vtensor<[4,32,1,?],f32>, !torch.list -> !torch.vtensor<[128,1,?],f32> %int0_2666 = torch.constant.int 0 %int0_2667 = torch.constant.int 0 %int9223372036854775807_2668 = torch.constant.int 9223372036854775807 %int1_2669 = torch.constant.int 1 %2492 = torch.aten.slice.Tensor %2462, %int0_2666, %int0_2667, %int9223372036854775807_2668, %int1_2669 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_2670 = torch.constant.int 1 %int0_2671 = torch.constant.int 0 %int1_2672 = torch.constant.int 1 %2493 = torch.aten.slice.Tensor %2492, %int1_2670, %int0_2671, %2440, %int1_2672 : 
!torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_2673 = torch.constant.int 1 %int2_2674 = torch.constant.int 2 %2494 = torch.aten.transpose.int %2493, %int1_2673, %int2_2674 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int1_2675 = torch.constant.int 1 %2495 = torch.aten.size.int %2466, %int1_2675 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_2676 = torch.constant.int 4 %int32_2677 = torch.constant.int 32 %int100_2678 = torch.constant.int 100 %2496 = torch.prim.ListConstruct %int4_2676, %int32_2677, %2495, %int100_2678 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_2679 = torch.constant.bool false %2497 = torch.aten.expand %2494, %2496, %false_2679 : !torch.vtensor<[4,32,?,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,?,100],f32> %int0_2680 = torch.constant.int 0 %2498 = torch.aten.clone %2497, %int0_2680 : !torch.vtensor<[4,32,?,100],f32>, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int128_2681 = torch.constant.int 128 %int100_2682 = torch.constant.int 100 %2499 = torch.prim.ListConstruct %int128_2681, %2495, %int100_2682 : (!torch.int, !torch.int, !torch.int) -> !torch.list %2500 = torch.aten._unsafe_view %2498, %2499 : !torch.vtensor<[4,32,?,100],f32>, !torch.list -> !torch.vtensor<[128,?,100],f32> %2501 = torch.aten.bmm %2491, %2500 : !torch.vtensor<[128,1,?],f32>, !torch.vtensor<[128,?,100],f32> -> !torch.vtensor<[128,1,100],f32> %int4_2683 = torch.constant.int 4 %int32_2684 = torch.constant.int 32 %int1_2685 = torch.constant.int 1 %int100_2686 = torch.constant.int 100 %2502 = torch.prim.ListConstruct %int4_2683, %int32_2684, %int1_2685, %int100_2686 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2503 = torch.aten.view %2501, %2502 : !torch.vtensor<[128,1,100],f32>, !torch.list -> !torch.vtensor<[4,32,1,100],f32> %int1_2687 = torch.constant.int 1 
%int2_2688 = torch.constant.int 2 %2504 = torch.aten.transpose.int %2503, %int1_2687, %int2_2688 : !torch.vtensor<[4,32,1,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,1,32,100],f32> %int4_2689 = torch.constant.int 4 %int1_2690 = torch.constant.int 1 %int-1_2691 = torch.constant.int -1 %2505 = torch.prim.ListConstruct %int4_2689, %int1_2690, %int-1_2691 : (!torch.int, !torch.int, !torch.int) -> !torch.list %2506 = torch.aten.view %2504, %2505 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,3200],f32> %2507 = torch_c.to_builtin_tensor %2506 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_2692 = tensor.cast %2507 : tensor<4x1x3200xf32> to tensor %2508 = torch_c.to_builtin_tensor %60 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %2509 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_2692, %2508) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_2693 = tensor.cast %2509 : tensor to tensor<4x1x3200xf32> %2510 = torch_c.from_builtin_tensor %cast_2693 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int1_2694 = torch.constant.int 1 %2511 = torch.aten.add.Tensor %2268, %2510, %int1_2694 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_2695 = torch.constant.int 2 %2512 = torch.aten.pow.Tensor_Scalar %2511, %int2_2695 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_2696 = torch.constant.int -1 %2513 = torch.prim.ListConstruct %int-1_2696 : (!torch.int) -> !torch.list %true_2697 = torch.constant.bool true %none_2698 = torch.constant.none %2514 = torch.aten.mean.dim %2512, %2513, %true_2697, %none_2698 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_2699 = torch.constant.float 9.9999999747524271E-7 %int1_2700 = torch.constant.int 1 %2515 = torch.aten.add.Scalar %2514, %float9.999990e-07_2699, %int1_2700 : 
!torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %2516 = torch.aten.rsqrt %2515 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %2517 = torch.aten.mul.Tensor %2511, %2516 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %2518 = torch.aten.mul.Tensor %2517, %61 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %2519 = torch_c.to_builtin_tensor %2518 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_2701 = tensor.cast %2519 : tensor<4x1x3200xf32> to tensor %2520 = torch_c.to_builtin_tensor %62 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %2521 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_2701, %2520) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_2702 = tensor.cast %2521 : tensor to tensor<4x1x8640xf32> %2522 = torch_c.from_builtin_tensor %cast_2702 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %2523 = torch.aten.silu %2522 : !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32> %2524 = torch_c.to_builtin_tensor %2518 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_2703 = tensor.cast %2524 : tensor<4x1x3200xf32> to tensor %2525 = torch_c.to_builtin_tensor %63 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %2526 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_2703, %2525) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_2704 = tensor.cast %2526 : tensor to tensor<4x1x8640xf32> %2527 = torch_c.from_builtin_tensor %cast_2704 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %2528 = torch.aten.mul.Tensor %2523, %2527 : !torch.vtensor<[4,1,8640],f32>, !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32> %2529 = torch_c.to_builtin_tensor %2528 : !torch.vtensor<[4,1,8640],f32> -> tensor<4x1x8640xf32> %cast_2705 = tensor.cast %2529 : tensor<4x1x8640xf32> to tensor %2530 = torch_c.to_builtin_tensor %64 : 
!torch.vtensor<[3200,8640],f16> -> tensor<3200x8640xf16> %2531 = util.call @sharktank_mmtfp_3d_3200_8640_f32f16f32(%cast_2705, %2530) : (tensor, tensor<3200x8640xf16>) -> tensor %cast_2706 = tensor.cast %2531 : tensor to tensor<4x1x3200xf32> %2532 = torch_c.from_builtin_tensor %cast_2706 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int1_2707 = torch.constant.int 1 %2533 = torch.aten.add.Tensor %2511, %2532, %int1_2707 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_2708 = torch.constant.int 2 %2534 = torch.aten.pow.Tensor_Scalar %2533, %int2_2708 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_2709 = torch.constant.int -1 %2535 = torch.prim.ListConstruct %int-1_2709 : (!torch.int) -> !torch.list %true_2710 = torch.constant.bool true %none_2711 = torch.constant.none %2536 = torch.aten.mean.dim %2534, %2535, %true_2710, %none_2711 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_2712 = torch.constant.float 9.9999999747524271E-7 %int1_2713 = torch.constant.int 1 %2537 = torch.aten.add.Scalar %2536, %float9.999990e-07_2712, %int1_2713 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %2538 = torch.aten.rsqrt %2537 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %2539 = torch.aten.mul.Tensor %2533, %2538 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %2540 = torch.aten.mul.Tensor %2539, %65 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %2541 = torch_c.to_builtin_tensor %2540 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_2714 = tensor.cast %2541 : tensor<4x1x3200xf32> to tensor %2542 = torch_c.to_builtin_tensor %66 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %2543 = util.call 
@sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_2714, %2542) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_2715 = tensor.cast %2543 : tensor to tensor<4x1x3200xf32> %2544 = torch_c.from_builtin_tensor %cast_2715 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %2545 = torch_c.to_builtin_tensor %2540 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_2716 = tensor.cast %2545 : tensor<4x1x3200xf32> to tensor %2546 = torch_c.to_builtin_tensor %67 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %2547 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_2716, %2546) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_2717 = tensor.cast %2547 : tensor to tensor<4x1x3200xf32> %2548 = torch_c.from_builtin_tensor %cast_2717 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %2549 = torch_c.to_builtin_tensor %2540 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_2718 = tensor.cast %2549 : tensor<4x1x3200xf32> to tensor %2550 = torch_c.to_builtin_tensor %68 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %2551 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_2718, %2550) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_2719 = tensor.cast %2551 : tensor to tensor<4x1x3200xf32> %2552 = torch_c.from_builtin_tensor %cast_2719 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int4_2720 = torch.constant.int 4 %int1_2721 = torch.constant.int 1 %int32_2722 = torch.constant.int 32 %int100_2723 = torch.constant.int 100 %2553 = torch.prim.ListConstruct %int4_2720, %int1_2721, %int32_2722, %int100_2723 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2554 = torch.aten.view %2544, %2553 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_2724 = torch.constant.int 4 %int1_2725 = torch.constant.int 1 %int32_2726 = torch.constant.int 32 %int100_2727 = torch.constant.int 100 %2555 = torch.prim.ListConstruct %int4_2724, %int1_2725, %int32_2726, %int100_2727 
: (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2556 = torch.aten.view %2548, %2555 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_2728 = torch.constant.int 4 %int1_2729 = torch.constant.int 1 %int32_2730 = torch.constant.int 32 %int100_2731 = torch.constant.int 100 %2557 = torch.prim.ListConstruct %int4_2728, %int1_2729, %int32_2730, %int100_2731 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2558 = torch.aten.view %2552, %2557 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_2732 = torch.constant.int 4 %int1_2733 = torch.constant.int 1 %int32_2734 = torch.constant.int 32 %int-1_2735 = torch.constant.int -1 %int2_2736 = torch.constant.int 2 %2559 = torch.prim.ListConstruct %int4_2732, %int1_2733, %int32_2734, %int-1_2735, %int2_2736 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2560 = torch.aten.view %2554, %2559 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %2561 = torch.aten.view_as_complex %2560 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %int4_2737 = torch.constant.int 4 %int1_2738 = torch.constant.int 1 %int32_2739 = torch.constant.int 32 %int-1_2740 = torch.constant.int -1 %int2_2741 = torch.constant.int 2 %2562 = torch.prim.ListConstruct %int4_2737, %int1_2738, %int32_2739, %int-1_2740, %int2_2741 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2563 = torch.aten.view %2556, %2562 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %2564 = torch.aten.view_as_complex %2563 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %2565 = torch.aten.mul.Tensor %2561, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %2566 = torch.aten.view_as_real %2565 : !torch.vtensor<[4,1,32,50],complex> -> 
!torch.vtensor<[4,1,32,50,2],f32> %int4_2742 = torch.constant.int 4 %int1_2743 = torch.constant.int 1 %int32_2744 = torch.constant.int 32 %int100_2745 = torch.constant.int 100 %2567 = torch.prim.ListConstruct %int4_2742, %int1_2743, %int32_2744, %int100_2745 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2568 = torch.aten.view %2566, %2567 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %2569 = torch.aten.mul.Tensor %2564, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %2570 = torch.aten.view_as_real %2569 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_2746 = torch.constant.int 4 %int1_2747 = torch.constant.int 1 %int32_2748 = torch.constant.int 32 %int100_2749 = torch.constant.int 100 %2571 = torch.prim.ListConstruct %int4_2746, %int1_2747, %int32_2748, %int100_2749 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2572 = torch.aten.view %2570, %2571 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int1_2750 = torch.constant.int 1 %int1_2751 = torch.constant.int 1 %2573 = torch.aten.add.Scalar %arg2, %int1_2750, %int1_2751 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[4],si64> %int0_2752 = torch.constant.int 0 %int0_2753 = torch.constant.int 0 %2574 = torch.aten.select.int %2573, %int0_2752, %int0_2753 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_2754 = torch.constant.int 0 %int0_2755 = torch.constant.int 0 %2575 = torch.aten.select.int %arg3, %int0_2754, %int0_2755 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_2756 = torch.constant.int 0 %int0_2757 = torch.constant.int 0 %int9223372036854775807_2758 = torch.constant.int 9223372036854775807 %int1_2759 = torch.constant.int 1 %2576 = torch.aten.slice.Tensor %2575, %int0_2756, %int0_2757, 
%int9223372036854775807_2758, %int1_2759 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_2760 = torch.constant.int 16 %2577 = torch.aten.floor_divide.Scalar %2574, %int16_2760 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_2761 = torch.constant.int 0 %2578 = torch.aten.index_select %2576, %int0_2761, %2577 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_2762 = torch.constant.int 16 %2579 = torch.aten.remainder.Scalar %2574, %int16_2762 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_2763 = torch.constant.none %2580 = torch.aten.clone %350, %none_2763 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_2764 = torch.constant.none %2581 = torch.aten.clone %351, %none_2764 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_2765 = torch.constant.int 0 %2582 = torch.aten.unsqueeze %2579, %int0_2765 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_2766 = torch.constant.int 0 %int0_2767 = torch.constant.int 0 %2583 = torch.aten.select.int %2572, %int0_2766, %int0_2767 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_2768 = torch.constant.int 0 %int0_2769 = torch.constant.int 0 %2584 = torch.aten.select.int %2583, %int0_2768, %int0_2769 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %int-1_2770 = torch.constant.int -1 %int26_2771 = torch.constant.int 26 %int2_2772 = torch.constant.int 2 %int16_2773 = torch.constant.int 16 %int32_2774 = torch.constant.int 32 %int100_2775 = torch.constant.int 100 %2585 = torch.prim.ListConstruct %int-1_2770, %int26_2771, %int2_2772, %int16_2773, %int32_2774, %int100_2775 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2586 = torch.aten.view %2420, %2585 : 
!torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %2587 = torch.prim.ListConstruct %2578, %2580, %2581, %2582 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_2776 = torch.constant.bool false %2588 = torch.aten.index_put %2586, %2587, %2584, %false_2776 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_2777 = torch.constant.int 2662400 %2589 = torch.prim.ListConstruct %731, %int2662400_2777 : (!torch.int, !torch.int) -> !torch.list %2590 = torch.aten.view %2588, %2589 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_2778 = torch.constant.int -1 %int26_2779 = torch.constant.int 26 %int2_2780 = torch.constant.int 2 %int16_2781 = torch.constant.int 16 %int32_2782 = torch.constant.int 32 %int100_2783 = torch.constant.int 100 %2591 = torch.prim.ListConstruct %int-1_2778, %int26_2779, %int2_2780, %int16_2781, %int32_2782, %int100_2783 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2592 = torch.aten.view %2590, %2591 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_2784 = torch.constant.none %2593 = torch.aten.clone %352, %none_2784 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_2785 = torch.constant.none %2594 = torch.aten.clone %353, %none_2785 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_2786 = torch.constant.int 0 %2595 = torch.aten.unsqueeze %2579, %int0_2786 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_2787 = torch.constant.int 0 %int0_2788 = torch.constant.int 0 %2596 = torch.aten.select.int %2558, %int0_2787, %int0_2788 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_2789 = 
torch.constant.int 0 %int0_2790 = torch.constant.int 0 %2597 = torch.aten.select.int %2596, %int0_2789, %int0_2790 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %2598 = torch.prim.ListConstruct %2578, %2593, %2594, %2595 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_2791 = torch.constant.bool false %2599 = torch.aten.index_put %2592, %2598, %2597, %false_2791 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_2792 = torch.constant.int 2662400 %2600 = torch.prim.ListConstruct %731, %int2662400_2792 : (!torch.int, !torch.int) -> !torch.list %2601 = torch.aten.view %2599, %2600 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_2793 = torch.constant.int -1 %int26_2794 = torch.constant.int 26 %int2_2795 = torch.constant.int 2 %int16_2796 = torch.constant.int 16 %int32_2797 = torch.constant.int 32 %int100_2798 = torch.constant.int 100 %2602 = torch.prim.ListConstruct %int-1_2793, %int26_2794, %int2_2795, %int16_2796, %int32_2797, %int100_2798 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2603 = torch.aten.view %2601, %2602 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_2799 = torch.constant.int 0 %int1_2800 = torch.constant.int 1 %2604 = torch.aten.select.int %2573, %int0_2799, %int1_2800 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_2801 = torch.constant.int 0 %int1_2802 = torch.constant.int 1 %2605 = torch.aten.select.int %arg3, %int0_2801, %int1_2802 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_2803 = torch.constant.int 0 %int0_2804 = torch.constant.int 0 %int9223372036854775807_2805 = torch.constant.int 9223372036854775807 
%int1_2806 = torch.constant.int 1 %2606 = torch.aten.slice.Tensor %2605, %int0_2803, %int0_2804, %int9223372036854775807_2805, %int1_2806 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_2807 = torch.constant.int 16 %2607 = torch.aten.floor_divide.Scalar %2604, %int16_2807 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_2808 = torch.constant.int 0 %2608 = torch.aten.index_select %2606, %int0_2808, %2607 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_2809 = torch.constant.int 16 %2609 = torch.aten.remainder.Scalar %2604, %int16_2809 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_2810 = torch.constant.none %2610 = torch.aten.clone %354, %none_2810 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_2811 = torch.constant.none %2611 = torch.aten.clone %355, %none_2811 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_2812 = torch.constant.int 0 %2612 = torch.aten.unsqueeze %2609, %int0_2812 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_2813 = torch.constant.int 0 %int1_2814 = torch.constant.int 1 %2613 = torch.aten.select.int %2572, %int0_2813, %int1_2814 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_2815 = torch.constant.int 0 %int0_2816 = torch.constant.int 0 %2614 = torch.aten.select.int %2613, %int0_2815, %int0_2816 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %2615 = torch.prim.ListConstruct %2608, %2610, %2611, %2612 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_2817 = torch.constant.bool false %2616 = torch.aten.index_put %2603, %2615, %2614, %false_2817 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> 
!torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_2818 = torch.constant.int 2662400 %2617 = torch.prim.ListConstruct %731, %int2662400_2818 : (!torch.int, !torch.int) -> !torch.list %2618 = torch.aten.view %2616, %2617 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_2819 = torch.constant.int -1 %int26_2820 = torch.constant.int 26 %int2_2821 = torch.constant.int 2 %int16_2822 = torch.constant.int 16 %int32_2823 = torch.constant.int 32 %int100_2824 = torch.constant.int 100 %2619 = torch.prim.ListConstruct %int-1_2819, %int26_2820, %int2_2821, %int16_2822, %int32_2823, %int100_2824 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2620 = torch.aten.view %2618, %2619 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_2825 = torch.constant.none %2621 = torch.aten.clone %356, %none_2825 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_2826 = torch.constant.none %2622 = torch.aten.clone %357, %none_2826 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_2827 = torch.constant.int 0 %2623 = torch.aten.unsqueeze %2609, %int0_2827 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_2828 = torch.constant.int 0 %int1_2829 = torch.constant.int 1 %2624 = torch.aten.select.int %2558, %int0_2828, %int1_2829 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_2830 = torch.constant.int 0 %int0_2831 = torch.constant.int 0 %2625 = torch.aten.select.int %2624, %int0_2830, %int0_2831 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %2626 = torch.prim.ListConstruct %2608, %2621, %2622, %2623 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_2832 = torch.constant.bool false %2627 = torch.aten.index_put %2620, %2626, %2625, 
%false_2832 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_2833 = torch.constant.int 2662400 %2628 = torch.prim.ListConstruct %731, %int2662400_2833 : (!torch.int, !torch.int) -> !torch.list %2629 = torch.aten.view %2627, %2628 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_2834 = torch.constant.int -1 %int26_2835 = torch.constant.int 26 %int2_2836 = torch.constant.int 2 %int16_2837 = torch.constant.int 16 %int32_2838 = torch.constant.int 32 %int100_2839 = torch.constant.int 100 %2630 = torch.prim.ListConstruct %int-1_2834, %int26_2835, %int2_2836, %int16_2837, %int32_2838, %int100_2839 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2631 = torch.aten.view %2629, %2630 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_2840 = torch.constant.int 0 %int2_2841 = torch.constant.int 2 %2632 = torch.aten.select.int %2573, %int0_2840, %int2_2841 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_2842 = torch.constant.int 0 %int2_2843 = torch.constant.int 2 %2633 = torch.aten.select.int %arg3, %int0_2842, %int2_2843 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_2844 = torch.constant.int 0 %int0_2845 = torch.constant.int 0 %int9223372036854775807_2846 = torch.constant.int 9223372036854775807 %int1_2847 = torch.constant.int 1 %2634 = torch.aten.slice.Tensor %2633, %int0_2844, %int0_2845, %int9223372036854775807_2846, %int1_2847 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_2848 = torch.constant.int 16 %2635 = torch.aten.floor_divide.Scalar %2632, %int16_2848 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_2849 = torch.constant.int 0 %2636 = torch.aten.index_select %2634, 
%int0_2849, %2635 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_2850 = torch.constant.int 16 %2637 = torch.aten.remainder.Scalar %2632, %int16_2850 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_2851 = torch.constant.none %2638 = torch.aten.clone %358, %none_2851 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_2852 = torch.constant.none %2639 = torch.aten.clone %359, %none_2852 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_2853 = torch.constant.int 0 %2640 = torch.aten.unsqueeze %2637, %int0_2853 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_2854 = torch.constant.int 0 %int2_2855 = torch.constant.int 2 %2641 = torch.aten.select.int %2572, %int0_2854, %int2_2855 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_2856 = torch.constant.int 0 %int0_2857 = torch.constant.int 0 %2642 = torch.aten.select.int %2641, %int0_2856, %int0_2857 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %2643 = torch.prim.ListConstruct %2636, %2638, %2639, %2640 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_2858 = torch.constant.bool false %2644 = torch.aten.index_put %2631, %2643, %2642, %false_2858 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_2859 = torch.constant.int 2662400 %2645 = torch.prim.ListConstruct %731, %int2662400_2859 : (!torch.int, !torch.int) -> !torch.list %2646 = torch.aten.view %2644, %2645 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_2860 = torch.constant.int -1 %int26_2861 = torch.constant.int 26 %int2_2862 = torch.constant.int 2 %int16_2863 = torch.constant.int 16 %int32_2864 = 
torch.constant.int 32 %int100_2865 = torch.constant.int 100 %2647 = torch.prim.ListConstruct %int-1_2860, %int26_2861, %int2_2862, %int16_2863, %int32_2864, %int100_2865 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2648 = torch.aten.view %2646, %2647 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_2866 = torch.constant.none %2649 = torch.aten.clone %360, %none_2866 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_2867 = torch.constant.none %2650 = torch.aten.clone %361, %none_2867 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_2868 = torch.constant.int 0 %2651 = torch.aten.unsqueeze %2637, %int0_2868 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_2869 = torch.constant.int 0 %int2_2870 = torch.constant.int 2 %2652 = torch.aten.select.int %2558, %int0_2869, %int2_2870 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_2871 = torch.constant.int 0 %int0_2872 = torch.constant.int 0 %2653 = torch.aten.select.int %2652, %int0_2871, %int0_2872 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %2654 = torch.prim.ListConstruct %2636, %2649, %2650, %2651 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_2873 = torch.constant.bool false %2655 = torch.aten.index_put %2648, %2654, %2653, %false_2873 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_2874 = torch.constant.int 2662400 %2656 = torch.prim.ListConstruct %731, %int2662400_2874 : (!torch.int, !torch.int) -> !torch.list %2657 = torch.aten.view %2655, %2656 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_2875 = torch.constant.int -1 %int26_2876 
= torch.constant.int 26 %int2_2877 = torch.constant.int 2 %int16_2878 = torch.constant.int 16 %int32_2879 = torch.constant.int 32 %int100_2880 = torch.constant.int 100 %2658 = torch.prim.ListConstruct %int-1_2875, %int26_2876, %int2_2877, %int16_2878, %int32_2879, %int100_2880 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2659 = torch.aten.view %2657, %2658 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_2881 = torch.constant.int 0 %int3_2882 = torch.constant.int 3 %2660 = torch.aten.select.int %2573, %int0_2881, %int3_2882 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_2883 = torch.constant.int 0 %int3_2884 = torch.constant.int 3 %2661 = torch.aten.select.int %arg3, %int0_2883, %int3_2884 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_2885 = torch.constant.int 0 %int0_2886 = torch.constant.int 0 %int9223372036854775807_2887 = torch.constant.int 9223372036854775807 %int1_2888 = torch.constant.int 1 %2662 = torch.aten.slice.Tensor %2661, %int0_2885, %int0_2886, %int9223372036854775807_2887, %int1_2888 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_2889 = torch.constant.int 16 %2663 = torch.aten.floor_divide.Scalar %2660, %int16_2889 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_2890 = torch.constant.int 0 %2664 = torch.aten.index_select %2662, %int0_2890, %2663 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_2891 = torch.constant.int 16 %2665 = torch.aten.remainder.Scalar %2660, %int16_2891 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_2892 = torch.constant.none %2666 = torch.aten.clone %362, %none_2892 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_2893 = torch.constant.none %2667 = torch.aten.clone %363, 
%none_2893 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_2894 = torch.constant.int 0 %2668 = torch.aten.unsqueeze %2665, %int0_2894 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_2895 = torch.constant.int 0 %int3_2896 = torch.constant.int 3 %2669 = torch.aten.select.int %2572, %int0_2895, %int3_2896 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_2897 = torch.constant.int 0 %int0_2898 = torch.constant.int 0 %2670 = torch.aten.select.int %2669, %int0_2897, %int0_2898 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %2671 = torch.prim.ListConstruct %2664, %2666, %2667, %2668 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_2899 = torch.constant.bool false %2672 = torch.aten.index_put %2659, %2671, %2670, %false_2899 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_2900 = torch.constant.int 2662400 %2673 = torch.prim.ListConstruct %731, %int2662400_2900 : (!torch.int, !torch.int) -> !torch.list %2674 = torch.aten.view %2672, %2673 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_2901 = torch.constant.int -1 %int26_2902 = torch.constant.int 26 %int2_2903 = torch.constant.int 2 %int16_2904 = torch.constant.int 16 %int32_2905 = torch.constant.int 32 %int100_2906 = torch.constant.int 100 %2675 = torch.prim.ListConstruct %int-1_2901, %int26_2902, %int2_2903, %int16_2904, %int32_2905, %int100_2906 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2676 = torch.aten.view %2674, %2675 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_2907 = torch.constant.none %2677 = torch.aten.clone %364, %none_2907 : 
!torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_2908 = torch.constant.none %2678 = torch.aten.clone %365, %none_2908 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_2909 = torch.constant.int 0 %2679 = torch.aten.unsqueeze %2665, %int0_2909 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_2910 = torch.constant.int 0 %int3_2911 = torch.constant.int 3 %2680 = torch.aten.select.int %2558, %int0_2910, %int3_2911 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_2912 = torch.constant.int 0 %int0_2913 = torch.constant.int 0 %2681 = torch.aten.select.int %2680, %int0_2912, %int0_2913 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %2682 = torch.prim.ListConstruct %2664, %2677, %2678, %2679 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_2914 = torch.constant.bool false %2683 = torch.aten.index_put %2676, %2682, %2681, %false_2914 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_2915 = torch.constant.int 2662400 %2684 = torch.prim.ListConstruct %731, %int2662400_2915 : (!torch.int, !torch.int) -> !torch.list %2685 = torch.aten.view %2683, %2684 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int52_2916 = torch.constant.int 52 %2686 = torch.aten.mul.Scalar %arg3, %int52_2916 : !torch.vtensor<[4,?],si64>, !torch.int -> !torch.vtensor<[4,?],si64> %int14 = torch.constant.int 14 %int1_2917 = torch.constant.int 1 %2687 = torch.aten.add.Scalar %2686, %int14, %int1_2917 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_2918 = torch.constant.int 4 %2688 = torch.aten.mul.int %int4_2918, %655 : !torch.int, !torch.int -> !torch.int %2689 = torch.prim.ListConstruct 
%2688 : (!torch.int) -> !torch.list %2690 = torch.aten.view %2687, %2689 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int-1_2919 = torch.constant.int -1 %int26_2920 = torch.constant.int 26 %int2_2921 = torch.constant.int 2 %int16_2922 = torch.constant.int 16 %int32_2923 = torch.constant.int 32 %int100_2924 = torch.constant.int 100 %2691 = torch.prim.ListConstruct %int-1_2919, %int26_2920, %int2_2921, %int16_2922, %int32_2923, %int100_2924 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2692 = torch.aten.view %2685, %2691 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int26_2925 = torch.constant.int 26 %2693 = torch.aten.mul.int %731, %int26_2925 : !torch.int, !torch.int -> !torch.int %int2_2926 = torch.constant.int 2 %2694 = torch.aten.mul.int %2693, %int2_2926 : !torch.int, !torch.int -> !torch.int %int16_2927 = torch.constant.int 16 %int32_2928 = torch.constant.int 32 %int100_2929 = torch.constant.int 100 %2695 = torch.prim.ListConstruct %2694, %int16_2927, %int32_2928, %int100_2929 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2696 = torch.aten.view %2692, %2695 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,16,32,100],f32> %int0_2930 = torch.constant.int 0 %2697 = torch.aten.index_select %2696, %int0_2930, %2690 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_2931 = torch.constant.int 4 %int16_2932 = torch.constant.int 16 %int32_2933 = torch.constant.int 32 %int100_2934 = torch.constant.int 100 %2698 = torch.prim.ListConstruct %int4_2931, %655, %int16_2932, %int32_2933, %int100_2934 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2699 = torch.aten.view %2697, %2698 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_2935 = torch.constant.int 1 %2700 = 
torch.aten.size.int %2699, %int1_2935 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_2936 = torch.constant.int 16 %2701 = torch.aten.mul.int %2700, %int16_2936 : !torch.int, !torch.int -> !torch.int %int4_2937 = torch.constant.int 4 %int32_2938 = torch.constant.int 32 %int100_2939 = torch.constant.int 100 %2702 = torch.prim.ListConstruct %int4_2937, %2701, %int32_2938, %int100_2939 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2703 = torch.aten.view %2699, %2702 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_2940 = torch.constant.int 0 %int0_2941 = torch.constant.int 0 %int9223372036854775807_2942 = torch.constant.int 9223372036854775807 %int1_2943 = torch.constant.int 1 %2704 = torch.aten.slice.Tensor %2445, %int0_2940, %int0_2941, %int9223372036854775807_2942, %int1_2943 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int16_2944 = torch.constant.int 16 %2705 = torch.aten.mul.int %655, %int16_2944 : !torch.int, !torch.int -> !torch.int %int1_2945 = torch.constant.int 1 %int0_2946 = torch.constant.int 0 %int1_2947 = torch.constant.int 1 %2706 = torch.aten.slice.Tensor %2704, %int1_2945, %int0_2946, %2705, %int1_2947 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_2948 = torch.constant.bool false %2707 = torch.aten.copy %2706, %2703, %false_2948 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_2949 = torch.constant.int 0 %int0_2950 = torch.constant.int 0 %int9223372036854775807_2951 = torch.constant.int 9223372036854775807 %int1_2952 = torch.constant.int 1 %2708 = torch.aten.slice.Tensor %2445, %int0_2949, %int0_2950, %int9223372036854775807_2951, %int1_2952 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> 
!torch.vtensor<[4,2048,32,100],f32> %int1_2953 = torch.constant.int 1 %int0_2954 = torch.constant.int 0 %int1_2955 = torch.constant.int 1 %2709 = torch.aten.slice_scatter %2708, %2707, %int1_2953, %int0_2954, %2705, %int1_2955 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_2956 = torch.constant.int 0 %int0_2957 = torch.constant.int 0 %int9223372036854775807_2958 = torch.constant.int 9223372036854775807 %int1_2959 = torch.constant.int 1 %2710 = torch.aten.slice_scatter %2445, %2709, %int0_2956, %int0_2957, %int9223372036854775807_2958, %int1_2959 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_2960 = torch.constant.int 1 %int1_2961 = torch.constant.int 1 %2711 = torch.aten.add.Scalar %2687, %int1_2960, %int1_2961 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_2962 = torch.constant.int 4 %2712 = torch.aten.mul.int %int4_2962, %655 : !torch.int, !torch.int -> !torch.int %2713 = torch.prim.ListConstruct %2712 : (!torch.int) -> !torch.list %2714 = torch.aten.view %2711, %2713 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int0_2963 = torch.constant.int 0 %2715 = torch.aten.index_select %2696, %int0_2963, %2714 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_2964 = torch.constant.int 4 %int16_2965 = torch.constant.int 16 %int32_2966 = torch.constant.int 32 %int100_2967 = torch.constant.int 100 %2716 = torch.prim.ListConstruct %int4_2964, %655, %int16_2965, %int32_2966, %int100_2967 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2717 = torch.aten.view %2715, %2716 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_2968 = 
torch.constant.int 1 %2718 = torch.aten.size.int %2717, %int1_2968 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_2969 = torch.constant.int 16 %2719 = torch.aten.mul.int %2718, %int16_2969 : !torch.int, !torch.int -> !torch.int %int4_2970 = torch.constant.int 4 %int32_2971 = torch.constant.int 32 %int100_2972 = torch.constant.int 100 %2720 = torch.prim.ListConstruct %int4_2970, %2719, %int32_2971, %int100_2972 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2721 = torch.aten.view %2717, %2720 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_2973 = torch.constant.int 0 %int0_2974 = torch.constant.int 0 %int9223372036854775807_2975 = torch.constant.int 9223372036854775807 %int1_2976 = torch.constant.int 1 %2722 = torch.aten.slice.Tensor %2462, %int0_2973, %int0_2974, %int9223372036854775807_2975, %int1_2976 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_2977 = torch.constant.int 1 %int0_2978 = torch.constant.int 0 %int1_2979 = torch.constant.int 1 %2723 = torch.aten.slice.Tensor %2722, %int1_2977, %int0_2978, %2705, %int1_2979 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_2980 = torch.constant.bool false %2724 = torch.aten.copy %2723, %2721, %false_2980 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_2981 = torch.constant.int 0 %int0_2982 = torch.constant.int 0 %int9223372036854775807_2983 = torch.constant.int 9223372036854775807 %int1_2984 = torch.constant.int 1 %2725 = torch.aten.slice.Tensor %2462, %int0_2981, %int0_2982, %int9223372036854775807_2983, %int1_2984 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_2985 = torch.constant.int 1 %int0_2986 = 
torch.constant.int 0 %int1_2987 = torch.constant.int 1 %2726 = torch.aten.slice_scatter %2725, %2724, %int1_2985, %int0_2986, %2705, %int1_2987 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_2988 = torch.constant.int 0 %int0_2989 = torch.constant.int 0 %int9223372036854775807_2990 = torch.constant.int 9223372036854775807 %int1_2991 = torch.constant.int 1 %2727 = torch.aten.slice_scatter %2462, %2726, %int0_2988, %int0_2989, %int9223372036854775807_2990, %int1_2991 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_2992 = torch.constant.int 0 %int0_2993 = torch.constant.int 0 %int9223372036854775807_2994 = torch.constant.int 9223372036854775807 %int1_2995 = torch.constant.int 1 %2728 = torch.aten.slice.Tensor %671, %int0_2992, %int0_2993, %int9223372036854775807_2994, %int1_2995 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_2996 = torch.constant.int 1 %int0_2997 = torch.constant.int 0 %int1_2998 = torch.constant.int 1 %2729 = torch.aten.slice.Tensor %2728, %int1_2996, %int0_2997, %2705, %int1_2998 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int0_2999 = torch.constant.int 0 %int0_3000 = torch.constant.int 0 %int9223372036854775807_3001 = torch.constant.int 9223372036854775807 %int1_3002 = torch.constant.int 1 %2730 = torch.aten.slice.Tensor %673, %int0_2999, %int0_3000, %int9223372036854775807_3001, %int1_3002 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_3003 = torch.constant.int 1 %int0_3004 = torch.constant.int 0 %int1_3005 = torch.constant.int 1 %2731 = torch.aten.slice.Tensor %2730, 
%int1_3003, %int0_3004, %2705, %int1_3005 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_3006 = torch.constant.int 1 %int2_3007 = torch.constant.int 2 %2732 = torch.aten.transpose.int %2568, %int1_3006, %int2_3007 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,1,100],f32> %int4_3008 = torch.constant.int 4 %int32_3009 = torch.constant.int 32 %int1_3010 = torch.constant.int 1 %int100_3011 = torch.constant.int 100 %2733 = torch.prim.ListConstruct %int4_3008, %int32_3009, %int1_3010, %int100_3011 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_3012 = torch.constant.bool false %2734 = torch.aten.expand %2732, %2733, %false_3012 : !torch.vtensor<[4,32,1,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,100],f32> %int128_3013 = torch.constant.int 128 %int1_3014 = torch.constant.int 1 %int100_3015 = torch.constant.int 100 %2735 = torch.prim.ListConstruct %int128_3013, %int1_3014, %int100_3015 : (!torch.int, !torch.int, !torch.int) -> !torch.list %2736 = torch.aten.view %2734, %2735 : !torch.vtensor<[4,32,1,100],f32>, !torch.list -> !torch.vtensor<[128,1,100],f32> %int0_3016 = torch.constant.int 0 %int0_3017 = torch.constant.int 0 %int9223372036854775807_3018 = torch.constant.int 9223372036854775807 %int1_3019 = torch.constant.int 1 %2737 = torch.aten.slice.Tensor %2710, %int0_3016, %int0_3017, %int9223372036854775807_3018, %int1_3019 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_3020 = torch.constant.int 1 %int0_3021 = torch.constant.int 0 %int1_3022 = torch.constant.int 1 %2738 = torch.aten.slice.Tensor %2737, %int1_3020, %int0_3021, %2705, %int1_3022 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_3023 = torch.constant.int 1 %int2_3024 = torch.constant.int 2 
%2739 = torch.aten.transpose.int %2738, %int1_3023, %int2_3024 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int2_3025 = torch.constant.int 2 %int3_3026 = torch.constant.int 3 %2740 = torch.aten.transpose.int %2739, %int2_3025, %int3_3026 : !torch.vtensor<[4,32,?,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int1_3027 = torch.constant.int 1 %2741 = torch.aten.size.int %2729, %int1_3027 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_3028 = torch.constant.int 4 %int32_3029 = torch.constant.int 32 %int100_3030 = torch.constant.int 100 %2742 = torch.prim.ListConstruct %int4_3028, %int32_3029, %int100_3030, %2741 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_3031 = torch.constant.bool false %2743 = torch.aten.expand %2740, %2742, %false_3031 : !torch.vtensor<[4,32,100,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,100,?],f32> %int0_3032 = torch.constant.int 0 %2744 = torch.aten.clone %2743, %int0_3032 : !torch.vtensor<[4,32,100,?],f32>, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int128_3033 = torch.constant.int 128 %int100_3034 = torch.constant.int 100 %2745 = torch.prim.ListConstruct %int128_3033, %int100_3034, %2741 : (!torch.int, !torch.int, !torch.int) -> !torch.list %2746 = torch.aten._unsafe_view %2744, %2745 : !torch.vtensor<[4,32,100,?],f32>, !torch.list -> !torch.vtensor<[128,100,?],f32> %2747 = torch.aten.bmm %2736, %2746 : !torch.vtensor<[128,1,100],f32>, !torch.vtensor<[128,100,?],f32> -> !torch.vtensor<[128,1,?],f32> %int4_3035 = torch.constant.int 4 %int32_3036 = torch.constant.int 32 %int1_3037 = torch.constant.int 1 %2748 = torch.prim.ListConstruct %int4_3035, %int32_3036, %int1_3037, %2741 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2749 = torch.aten.view %2747, %2748 : !torch.vtensor<[128,1,?],f32>, !torch.list -> !torch.vtensor<[4,32,1,?],f32> %float1.000000e01_3038 = torch.constant.float 
1.000000e+01 %2750 = torch.aten.div.Scalar %2749, %float1.000000e01_3038 : !torch.vtensor<[4,32,1,?],f32>, !torch.float -> !torch.vtensor<[4,32,1,?],f32> %int1_3039 = torch.constant.int 1 %2751 = torch.aten.add.Tensor %2750, %895, %int1_3039 : !torch.vtensor<[4,32,1,?],f32>, !torch.vtensor<[4,1,1,?],f32>, !torch.int -> !torch.vtensor<[4,32,1,?],f32> %int-1_3040 = torch.constant.int -1 %false_3041 = torch.constant.bool false %2752 = torch.aten._softmax %2751, %int-1_3040, %false_3041 : !torch.vtensor<[4,32,1,?],f32>, !torch.int, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int4_3042 = torch.constant.int 4 %int32_3043 = torch.constant.int 32 %int1_3044 = torch.constant.int 1 %2753 = torch.prim.ListConstruct %int4_3042, %int32_3043, %int1_3044, %2741 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_3045 = torch.constant.bool false %2754 = torch.aten.expand %2752, %2753, %false_3045 : !torch.vtensor<[4,32,1,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int128_3046 = torch.constant.int 128 %int1_3047 = torch.constant.int 1 %2755 = torch.prim.ListConstruct %int128_3046, %int1_3047, %2741 : (!torch.int, !torch.int, !torch.int) -> !torch.list %2756 = torch.aten.view %2754, %2755 : !torch.vtensor<[4,32,1,?],f32>, !torch.list -> !torch.vtensor<[128,1,?],f32> %int0_3048 = torch.constant.int 0 %int0_3049 = torch.constant.int 0 %int9223372036854775807_3050 = torch.constant.int 9223372036854775807 %int1_3051 = torch.constant.int 1 %2757 = torch.aten.slice.Tensor %2727, %int0_3048, %int0_3049, %int9223372036854775807_3050, %int1_3051 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_3052 = torch.constant.int 1 %int0_3053 = torch.constant.int 0 %int1_3054 = torch.constant.int 1 %2758 = torch.aten.slice.Tensor %2757, %int1_3052, %int0_3053, %2705, %int1_3054 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> 
!torch.vtensor<[4,?,32,100],f32> %int1_3055 = torch.constant.int 1 %int2_3056 = torch.constant.int 2 %2759 = torch.aten.transpose.int %2758, %int1_3055, %int2_3056 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int1_3057 = torch.constant.int 1 %2760 = torch.aten.size.int %2731, %int1_3057 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_3058 = torch.constant.int 4 %int32_3059 = torch.constant.int 32 %int100_3060 = torch.constant.int 100 %2761 = torch.prim.ListConstruct %int4_3058, %int32_3059, %2760, %int100_3060 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_3061 = torch.constant.bool false %2762 = torch.aten.expand %2759, %2761, %false_3061 : !torch.vtensor<[4,32,?,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,?,100],f32> %int0_3062 = torch.constant.int 0 %2763 = torch.aten.clone %2762, %int0_3062 : !torch.vtensor<[4,32,?,100],f32>, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int128_3063 = torch.constant.int 128 %int100_3064 = torch.constant.int 100 %2764 = torch.prim.ListConstruct %int128_3063, %2760, %int100_3064 : (!torch.int, !torch.int, !torch.int) -> !torch.list %2765 = torch.aten._unsafe_view %2763, %2764 : !torch.vtensor<[4,32,?,100],f32>, !torch.list -> !torch.vtensor<[128,?,100],f32> %2766 = torch.aten.bmm %2756, %2765 : !torch.vtensor<[128,1,?],f32>, !torch.vtensor<[128,?,100],f32> -> !torch.vtensor<[128,1,100],f32> %int4_3065 = torch.constant.int 4 %int32_3066 = torch.constant.int 32 %int1_3067 = torch.constant.int 1 %int100_3068 = torch.constant.int 100 %2767 = torch.prim.ListConstruct %int4_3065, %int32_3066, %int1_3067, %int100_3068 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2768 = torch.aten.view %2766, %2767 : !torch.vtensor<[128,1,100],f32>, !torch.list -> !torch.vtensor<[4,32,1,100],f32> %int1_3069 = torch.constant.int 1 %int2_3070 = torch.constant.int 2 %2769 = torch.aten.transpose.int %2768, %int1_3069, 
%int2_3070 : !torch.vtensor<[4,32,1,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,1,32,100],f32> %int4_3071 = torch.constant.int 4 %int1_3072 = torch.constant.int 1 %int-1_3073 = torch.constant.int -1 %2770 = torch.prim.ListConstruct %int4_3071, %int1_3072, %int-1_3073 : (!torch.int, !torch.int, !torch.int) -> !torch.list %2771 = torch.aten.view %2769, %2770 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,3200],f32> %2772 = torch_c.to_builtin_tensor %2771 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_3074 = tensor.cast %2772 : tensor<4x1x3200xf32> to tensor %2773 = torch_c.to_builtin_tensor %69 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %2774 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_3074, %2773) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_3075 = tensor.cast %2774 : tensor to tensor<4x1x3200xf32> %2775 = torch_c.from_builtin_tensor %cast_3075 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int1_3076 = torch.constant.int 1 %2776 = torch.aten.add.Tensor %2533, %2775, %int1_3076 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_3077 = torch.constant.int 2 %2777 = torch.aten.pow.Tensor_Scalar %2776, %int2_3077 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_3078 = torch.constant.int -1 %2778 = torch.prim.ListConstruct %int-1_3078 : (!torch.int) -> !torch.list %true_3079 = torch.constant.bool true %none_3080 = torch.constant.none %2779 = torch.aten.mean.dim %2777, %2778, %true_3079, %none_3080 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_3081 = torch.constant.float 9.9999999747524271E-7 %int1_3082 = torch.constant.int 1 %2780 = torch.aten.add.Scalar %2779, %float9.999990e-07_3081, %int1_3082 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %2781 = 
torch.aten.rsqrt %2780 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %2782 = torch.aten.mul.Tensor %2776, %2781 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %2783 = torch.aten.mul.Tensor %2782, %70 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %2784 = torch_c.to_builtin_tensor %2783 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_3083 = tensor.cast %2784 : tensor<4x1x3200xf32> to tensor %2785 = torch_c.to_builtin_tensor %71 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %2786 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_3083, %2785) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_3084 = tensor.cast %2786 : tensor to tensor<4x1x8640xf32> %2787 = torch_c.from_builtin_tensor %cast_3084 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %2788 = torch.aten.silu %2787 : !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32> %2789 = torch_c.to_builtin_tensor %2783 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_3085 = tensor.cast %2789 : tensor<4x1x3200xf32> to tensor %2790 = torch_c.to_builtin_tensor %72 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %2791 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_3085, %2790) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_3086 = tensor.cast %2791 : tensor to tensor<4x1x8640xf32> %2792 = torch_c.from_builtin_tensor %cast_3086 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %2793 = torch.aten.mul.Tensor %2788, %2792 : !torch.vtensor<[4,1,8640],f32>, !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32> %2794 = torch_c.to_builtin_tensor %2793 : !torch.vtensor<[4,1,8640],f32> -> tensor<4x1x8640xf32> %cast_3087 = tensor.cast %2794 : tensor<4x1x8640xf32> to tensor %2795 = torch_c.to_builtin_tensor %73 : !torch.vtensor<[3200,8640],f16> -> tensor<3200x8640xf16> %2796 = util.call 
@sharktank_mmtfp_3d_3200_8640_f32f16f32(%cast_3087, %2795) : (tensor, tensor<3200x8640xf16>) -> tensor %cast_3088 = tensor.cast %2796 : tensor to tensor<4x1x3200xf32> %2797 = torch_c.from_builtin_tensor %cast_3088 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int1_3089 = torch.constant.int 1 %2798 = torch.aten.add.Tensor %2776, %2797, %int1_3089 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_3090 = torch.constant.int 2 %2799 = torch.aten.pow.Tensor_Scalar %2798, %int2_3090 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_3091 = torch.constant.int -1 %2800 = torch.prim.ListConstruct %int-1_3091 : (!torch.int) -> !torch.list %true_3092 = torch.constant.bool true %none_3093 = torch.constant.none %2801 = torch.aten.mean.dim %2799, %2800, %true_3092, %none_3093 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_3094 = torch.constant.float 9.9999999747524271E-7 %int1_3095 = torch.constant.int 1 %2802 = torch.aten.add.Scalar %2801, %float9.999990e-07_3094, %int1_3095 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %2803 = torch.aten.rsqrt %2802 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %2804 = torch.aten.mul.Tensor %2798, %2803 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %2805 = torch.aten.mul.Tensor %2804, %74 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %2806 = torch_c.to_builtin_tensor %2805 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_3096 = tensor.cast %2806 : tensor<4x1x3200xf32> to tensor %2807 = torch_c.to_builtin_tensor %75 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %2808 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_3096, %2807) : (tensor, tensor<3200x3200xf16>) -> tensor 
%cast_3097 = tensor.cast %2808 : tensor to tensor<4x1x3200xf32> %2809 = torch_c.from_builtin_tensor %cast_3097 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %2810 = torch_c.to_builtin_tensor %2805 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_3098 = tensor.cast %2810 : tensor<4x1x3200xf32> to tensor %2811 = torch_c.to_builtin_tensor %76 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %2812 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_3098, %2811) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_3099 = tensor.cast %2812 : tensor to tensor<4x1x3200xf32> %2813 = torch_c.from_builtin_tensor %cast_3099 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %2814 = torch_c.to_builtin_tensor %2805 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_3100 = tensor.cast %2814 : tensor<4x1x3200xf32> to tensor %2815 = torch_c.to_builtin_tensor %77 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %2816 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_3100, %2815) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_3101 = tensor.cast %2816 : tensor to tensor<4x1x3200xf32> %2817 = torch_c.from_builtin_tensor %cast_3101 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int4_3102 = torch.constant.int 4 %int1_3103 = torch.constant.int 1 %int32_3104 = torch.constant.int 32 %int100_3105 = torch.constant.int 100 %2818 = torch.prim.ListConstruct %int4_3102, %int1_3103, %int32_3104, %int100_3105 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2819 = torch.aten.view %2809, %2818 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_3106 = torch.constant.int 4 %int1_3107 = torch.constant.int 1 %int32_3108 = torch.constant.int 32 %int100_3109 = torch.constant.int 100 %2820 = torch.prim.ListConstruct %int4_3106, %int1_3107, %int32_3108, %int100_3109 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2821 = torch.aten.view %2813, %2820 
: !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_3110 = torch.constant.int 4 %int1_3111 = torch.constant.int 1 %int32_3112 = torch.constant.int 32 %int100_3113 = torch.constant.int 100 %2822 = torch.prim.ListConstruct %int4_3110, %int1_3111, %int32_3112, %int100_3113 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2823 = torch.aten.view %2817, %2822 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_3114 = torch.constant.int 4 %int1_3115 = torch.constant.int 1 %int32_3116 = torch.constant.int 32 %int-1_3117 = torch.constant.int -1 %int2_3118 = torch.constant.int 2 %2824 = torch.prim.ListConstruct %int4_3114, %int1_3115, %int32_3116, %int-1_3117, %int2_3118 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2825 = torch.aten.view %2819, %2824 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %2826 = torch.aten.view_as_complex %2825 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %int4_3119 = torch.constant.int 4 %int1_3120 = torch.constant.int 1 %int32_3121 = torch.constant.int 32 %int-1_3122 = torch.constant.int -1 %int2_3123 = torch.constant.int 2 %2827 = torch.prim.ListConstruct %int4_3119, %int1_3120, %int32_3121, %int-1_3122, %int2_3123 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2828 = torch.aten.view %2821, %2827 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %2829 = torch.aten.view_as_complex %2828 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %2830 = torch.aten.mul.Tensor %2826, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %2831 = torch.aten.view_as_real %2830 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_3124 = torch.constant.int 4 %int1_3125 = torch.constant.int 1 
%int32_3126 = torch.constant.int 32 %int100_3127 = torch.constant.int 100 %2832 = torch.prim.ListConstruct %int4_3124, %int1_3125, %int32_3126, %int100_3127 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2833 = torch.aten.view %2831, %2832 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %2834 = torch.aten.mul.Tensor %2829, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %2835 = torch.aten.view_as_real %2834 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_3128 = torch.constant.int 4 %int1_3129 = torch.constant.int 1 %int32_3130 = torch.constant.int 32 %int100_3131 = torch.constant.int 100 %2836 = torch.prim.ListConstruct %int4_3128, %int1_3129, %int32_3130, %int100_3131 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2837 = torch.aten.view %2835, %2836 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int1_3132 = torch.constant.int 1 %int1_3133 = torch.constant.int 1 %2838 = torch.aten.add.Scalar %arg2, %int1_3132, %int1_3133 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[4],si64> %int0_3134 = torch.constant.int 0 %int0_3135 = torch.constant.int 0 %2839 = torch.aten.select.int %2838, %int0_3134, %int0_3135 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_3136 = torch.constant.int 0 %int0_3137 = torch.constant.int 0 %2840 = torch.aten.select.int %arg3, %int0_3136, %int0_3137 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_3138 = torch.constant.int 0 %int0_3139 = torch.constant.int 0 %int9223372036854775807_3140 = torch.constant.int 9223372036854775807 %int1_3141 = torch.constant.int 1 %2841 = torch.aten.slice.Tensor %2840, %int0_3138, %int0_3139, %int9223372036854775807_3140, %int1_3141 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int 
-> !torch.vtensor<[?],si64> %int16_3142 = torch.constant.int 16 %2842 = torch.aten.floor_divide.Scalar %2839, %int16_3142 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_3143 = torch.constant.int 0 %2843 = torch.aten.index_select %2841, %int0_3143, %2842 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_3144 = torch.constant.int 16 %2844 = torch.aten.remainder.Scalar %2839, %int16_3144 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_3145 = torch.constant.none %2845 = torch.aten.clone %366, %none_3145 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_3146 = torch.constant.none %2846 = torch.aten.clone %367, %none_3146 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_3147 = torch.constant.int 0 %2847 = torch.aten.unsqueeze %2844, %int0_3147 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_3148 = torch.constant.int 0 %int0_3149 = torch.constant.int 0 %2848 = torch.aten.select.int %2837, %int0_3148, %int0_3149 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_3150 = torch.constant.int 0 %int0_3151 = torch.constant.int 0 %2849 = torch.aten.select.int %2848, %int0_3150, %int0_3151 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %int-1_3152 = torch.constant.int -1 %int26_3153 = torch.constant.int 26 %int2_3154 = torch.constant.int 2 %int16_3155 = torch.constant.int 16 %int32_3156 = torch.constant.int 32 %int100_3157 = torch.constant.int 100 %2850 = torch.prim.ListConstruct %int-1_3152, %int26_3153, %int2_3154, %int16_3155, %int32_3156, %int100_3157 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2851 = torch.aten.view %2685, %2850 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %2852 = torch.prim.ListConstruct %2843, %2845, %2846, %2847 
: (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_3158 = torch.constant.bool false %2853 = torch.aten.index_put %2851, %2852, %2849, %false_3158 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_3159 = torch.constant.int 2662400 %2854 = torch.prim.ListConstruct %731, %int2662400_3159 : (!torch.int, !torch.int) -> !torch.list %2855 = torch.aten.view %2853, %2854 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_3160 = torch.constant.int -1 %int26_3161 = torch.constant.int 26 %int2_3162 = torch.constant.int 2 %int16_3163 = torch.constant.int 16 %int32_3164 = torch.constant.int 32 %int100_3165 = torch.constant.int 100 %2856 = torch.prim.ListConstruct %int-1_3160, %int26_3161, %int2_3162, %int16_3163, %int32_3164, %int100_3165 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2857 = torch.aten.view %2855, %2856 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_3166 = torch.constant.none %2858 = torch.aten.clone %368, %none_3166 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_3167 = torch.constant.none %2859 = torch.aten.clone %369, %none_3167 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_3168 = torch.constant.int 0 %2860 = torch.aten.unsqueeze %2844, %int0_3168 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_3169 = torch.constant.int 0 %int0_3170 = torch.constant.int 0 %2861 = torch.aten.select.int %2823, %int0_3169, %int0_3170 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_3171 = torch.constant.int 0 %int0_3172 = torch.constant.int 0 %2862 = torch.aten.select.int %2861, %int0_3171, %int0_3172 : !torch.vtensor<[1,32,100],f32>, 
!torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %2863 = torch.prim.ListConstruct %2843, %2858, %2859, %2860 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_3173 = torch.constant.bool false %2864 = torch.aten.index_put %2857, %2863, %2862, %false_3173 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_3174 = torch.constant.int 2662400 %2865 = torch.prim.ListConstruct %731, %int2662400_3174 : (!torch.int, !torch.int) -> !torch.list %2866 = torch.aten.view %2864, %2865 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_3175 = torch.constant.int -1 %int26_3176 = torch.constant.int 26 %int2_3177 = torch.constant.int 2 %int16_3178 = torch.constant.int 16 %int32_3179 = torch.constant.int 32 %int100_3180 = torch.constant.int 100 %2867 = torch.prim.ListConstruct %int-1_3175, %int26_3176, %int2_3177, %int16_3178, %int32_3179, %int100_3180 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2868 = torch.aten.view %2866, %2867 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_3181 = torch.constant.int 0 %int1_3182 = torch.constant.int 1 %2869 = torch.aten.select.int %2838, %int0_3181, %int1_3182 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_3183 = torch.constant.int 0 %int1_3184 = torch.constant.int 1 %2870 = torch.aten.select.int %arg3, %int0_3183, %int1_3184 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_3185 = torch.constant.int 0 %int0_3186 = torch.constant.int 0 %int9223372036854775807_3187 = torch.constant.int 9223372036854775807 %int1_3188 = torch.constant.int 1 %2871 = torch.aten.slice.Tensor %2870, %int0_3185, %int0_3186, %int9223372036854775807_3187, %int1_3188 : 
!torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_3189 = torch.constant.int 16 %2872 = torch.aten.floor_divide.Scalar %2869, %int16_3189 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_3190 = torch.constant.int 0 %2873 = torch.aten.index_select %2871, %int0_3190, %2872 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_3191 = torch.constant.int 16 %2874 = torch.aten.remainder.Scalar %2869, %int16_3191 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_3192 = torch.constant.none %2875 = torch.aten.clone %370, %none_3192 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_3193 = torch.constant.none %2876 = torch.aten.clone %371, %none_3193 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_3194 = torch.constant.int 0 %2877 = torch.aten.unsqueeze %2874, %int0_3194 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_3195 = torch.constant.int 0 %int1_3196 = torch.constant.int 1 %2878 = torch.aten.select.int %2837, %int0_3195, %int1_3196 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_3197 = torch.constant.int 0 %int0_3198 = torch.constant.int 0 %2879 = torch.aten.select.int %2878, %int0_3197, %int0_3198 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %2880 = torch.prim.ListConstruct %2873, %2875, %2876, %2877 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_3199 = torch.constant.bool false %2881 = torch.aten.index_put %2868, %2880, %2879, %false_3199 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_3200 = torch.constant.int 2662400 %2882 = torch.prim.ListConstruct %731, %int2662400_3200 : 
(!torch.int, !torch.int) -> !torch.list %2883 = torch.aten.view %2881, %2882 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_3201 = torch.constant.int -1 %int26_3202 = torch.constant.int 26 %int2_3203 = torch.constant.int 2 %int16_3204 = torch.constant.int 16 %int32_3205 = torch.constant.int 32 %int100_3206 = torch.constant.int 100 %2884 = torch.prim.ListConstruct %int-1_3201, %int26_3202, %int2_3203, %int16_3204, %int32_3205, %int100_3206 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2885 = torch.aten.view %2883, %2884 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_3207 = torch.constant.none %2886 = torch.aten.clone %372, %none_3207 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_3208 = torch.constant.none %2887 = torch.aten.clone %373, %none_3208 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_3209 = torch.constant.int 0 %2888 = torch.aten.unsqueeze %2874, %int0_3209 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_3210 = torch.constant.int 0 %int1_3211 = torch.constant.int 1 %2889 = torch.aten.select.int %2823, %int0_3210, %int1_3211 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_3212 = torch.constant.int 0 %int0_3213 = torch.constant.int 0 %2890 = torch.aten.select.int %2889, %int0_3212, %int0_3213 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %2891 = torch.prim.ListConstruct %2873, %2886, %2887, %2888 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_3214 = torch.constant.bool false %2892 = torch.aten.index_put %2885, %2891, %2890, %false_3214 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> 
!torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_3215 = torch.constant.int 2662400 %2893 = torch.prim.ListConstruct %731, %int2662400_3215 : (!torch.int, !torch.int) -> !torch.list %2894 = torch.aten.view %2892, %2893 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_3216 = torch.constant.int -1 %int26_3217 = torch.constant.int 26 %int2_3218 = torch.constant.int 2 %int16_3219 = torch.constant.int 16 %int32_3220 = torch.constant.int 32 %int100_3221 = torch.constant.int 100 %2895 = torch.prim.ListConstruct %int-1_3216, %int26_3217, %int2_3218, %int16_3219, %int32_3220, %int100_3221 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2896 = torch.aten.view %2894, %2895 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_3222 = torch.constant.int 0 %int2_3223 = torch.constant.int 2 %2897 = torch.aten.select.int %2838, %int0_3222, %int2_3223 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_3224 = torch.constant.int 0 %int2_3225 = torch.constant.int 2 %2898 = torch.aten.select.int %arg3, %int0_3224, %int2_3225 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_3226 = torch.constant.int 0 %int0_3227 = torch.constant.int 0 %int9223372036854775807_3228 = torch.constant.int 9223372036854775807 %int1_3229 = torch.constant.int 1 %2899 = torch.aten.slice.Tensor %2898, %int0_3226, %int0_3227, %int9223372036854775807_3228, %int1_3229 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_3230 = torch.constant.int 16 %2900 = torch.aten.floor_divide.Scalar %2897, %int16_3230 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_3231 = torch.constant.int 0 %2901 = torch.aten.index_select %2899, %int0_3231, %2900 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_3232 
= torch.constant.int 16 %2902 = torch.aten.remainder.Scalar %2897, %int16_3232 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_3233 = torch.constant.none %2903 = torch.aten.clone %374, %none_3233 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_3234 = torch.constant.none %2904 = torch.aten.clone %375, %none_3234 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_3235 = torch.constant.int 0 %2905 = torch.aten.unsqueeze %2902, %int0_3235 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_3236 = torch.constant.int 0 %int2_3237 = torch.constant.int 2 %2906 = torch.aten.select.int %2837, %int0_3236, %int2_3237 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_3238 = torch.constant.int 0 %int0_3239 = torch.constant.int 0 %2907 = torch.aten.select.int %2906, %int0_3238, %int0_3239 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %2908 = torch.prim.ListConstruct %2901, %2903, %2904, %2905 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_3240 = torch.constant.bool false %2909 = torch.aten.index_put %2896, %2908, %2907, %false_3240 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_3241 = torch.constant.int 2662400 %2910 = torch.prim.ListConstruct %731, %int2662400_3241 : (!torch.int, !torch.int) -> !torch.list %2911 = torch.aten.view %2909, %2910 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_3242 = torch.constant.int -1 %int26_3243 = torch.constant.int 26 %int2_3244 = torch.constant.int 2 %int16_3245 = torch.constant.int 16 %int32_3246 = torch.constant.int 32 %int100_3247 = torch.constant.int 100 %2912 = torch.prim.ListConstruct %int-1_3242, %int26_3243, %int2_3244, 
%int16_3245, %int32_3246, %int100_3247 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2913 = torch.aten.view %2911, %2912 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_3248 = torch.constant.none %2914 = torch.aten.clone %376, %none_3248 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_3249 = torch.constant.none %2915 = torch.aten.clone %377, %none_3249 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_3250 = torch.constant.int 0 %2916 = torch.aten.unsqueeze %2902, %int0_3250 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_3251 = torch.constant.int 0 %int2_3252 = torch.constant.int 2 %2917 = torch.aten.select.int %2823, %int0_3251, %int2_3252 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_3253 = torch.constant.int 0 %int0_3254 = torch.constant.int 0 %2918 = torch.aten.select.int %2917, %int0_3253, %int0_3254 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %2919 = torch.prim.ListConstruct %2901, %2914, %2915, %2916 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_3255 = torch.constant.bool false %2920 = torch.aten.index_put %2913, %2919, %2918, %false_3255 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_3256 = torch.constant.int 2662400 %2921 = torch.prim.ListConstruct %731, %int2662400_3256 : (!torch.int, !torch.int) -> !torch.list %2922 = torch.aten.view %2920, %2921 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_3257 = torch.constant.int -1 %int26_3258 = torch.constant.int 26 %int2_3259 = torch.constant.int 2 %int16_3260 = torch.constant.int 16 %int32_3261 = torch.constant.int 32 
%int100_3262 = torch.constant.int 100 %2923 = torch.prim.ListConstruct %int-1_3257, %int26_3258, %int2_3259, %int16_3260, %int32_3261, %int100_3262 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2924 = torch.aten.view %2922, %2923 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_3263 = torch.constant.int 0 %int3_3264 = torch.constant.int 3 %2925 = torch.aten.select.int %2838, %int0_3263, %int3_3264 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_3265 = torch.constant.int 0 %int3_3266 = torch.constant.int 3 %2926 = torch.aten.select.int %arg3, %int0_3265, %int3_3266 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_3267 = torch.constant.int 0 %int0_3268 = torch.constant.int 0 %int9223372036854775807_3269 = torch.constant.int 9223372036854775807 %int1_3270 = torch.constant.int 1 %2927 = torch.aten.slice.Tensor %2926, %int0_3267, %int0_3268, %int9223372036854775807_3269, %int1_3270 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_3271 = torch.constant.int 16 %2928 = torch.aten.floor_divide.Scalar %2925, %int16_3271 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_3272 = torch.constant.int 0 %2929 = torch.aten.index_select %2927, %int0_3272, %2928 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_3273 = torch.constant.int 16 %2930 = torch.aten.remainder.Scalar %2925, %int16_3273 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_3274 = torch.constant.none %2931 = torch.aten.clone %378, %none_3274 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_3275 = torch.constant.none %2932 = torch.aten.clone %379, %none_3275 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_3276 = torch.constant.int 0 %2933 = 
torch.aten.unsqueeze %2930, %int0_3276 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_3277 = torch.constant.int 0 %int3_3278 = torch.constant.int 3 %2934 = torch.aten.select.int %2837, %int0_3277, %int3_3278 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_3279 = torch.constant.int 0 %int0_3280 = torch.constant.int 0 %2935 = torch.aten.select.int %2934, %int0_3279, %int0_3280 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %2936 = torch.prim.ListConstruct %2929, %2931, %2932, %2933 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_3281 = torch.constant.bool false %2937 = torch.aten.index_put %2924, %2936, %2935, %false_3281 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_3282 = torch.constant.int 2662400 %2938 = torch.prim.ListConstruct %731, %int2662400_3282 : (!torch.int, !torch.int) -> !torch.list %2939 = torch.aten.view %2937, %2938 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_3283 = torch.constant.int -1 %int26_3284 = torch.constant.int 26 %int2_3285 = torch.constant.int 2 %int16_3286 = torch.constant.int 16 %int32_3287 = torch.constant.int 32 %int100_3288 = torch.constant.int 100 %2940 = torch.prim.ListConstruct %int-1_3283, %int26_3284, %int2_3285, %int16_3286, %int32_3287, %int100_3288 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2941 = torch.aten.view %2939, %2940 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_3289 = torch.constant.none %2942 = torch.aten.clone %380, %none_3289 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_3290 = torch.constant.none %2943 = torch.aten.clone %381, %none_3290 : 
!torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_3291 = torch.constant.int 0 %2944 = torch.aten.unsqueeze %2930, %int0_3291 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_3292 = torch.constant.int 0 %int3_3293 = torch.constant.int 3 %2945 = torch.aten.select.int %2823, %int0_3292, %int3_3293 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_3294 = torch.constant.int 0 %int0_3295 = torch.constant.int 0 %2946 = torch.aten.select.int %2945, %int0_3294, %int0_3295 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %2947 = torch.prim.ListConstruct %2929, %2942, %2943, %2944 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_3296 = torch.constant.bool false %2948 = torch.aten.index_put %2941, %2947, %2946, %false_3296 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_3297 = torch.constant.int 2662400 %2949 = torch.prim.ListConstruct %731, %int2662400_3297 : (!torch.int, !torch.int) -> !torch.list %2950 = torch.aten.view %2948, %2949 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int52_3298 = torch.constant.int 52 %2951 = torch.aten.mul.Scalar %arg3, %int52_3298 : !torch.vtensor<[4,?],si64>, !torch.int -> !torch.vtensor<[4,?],si64> %int16_3299 = torch.constant.int 16 %int1_3300 = torch.constant.int 1 %2952 = torch.aten.add.Scalar %2951, %int16_3299, %int1_3300 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_3301 = torch.constant.int 4 %2953 = torch.aten.mul.int %int4_3301, %655 : !torch.int, !torch.int -> !torch.int %2954 = torch.prim.ListConstruct %2953 : (!torch.int) -> !torch.list %2955 = torch.aten.view %2952, %2954 : !torch.vtensor<[4,?],si64>, !torch.list -> 
!torch.vtensor<[?],si64> %int-1_3302 = torch.constant.int -1 %int26_3303 = torch.constant.int 26 %int2_3304 = torch.constant.int 2 %int16_3305 = torch.constant.int 16 %int32_3306 = torch.constant.int 32 %int100_3307 = torch.constant.int 100 %2956 = torch.prim.ListConstruct %int-1_3302, %int26_3303, %int2_3304, %int16_3305, %int32_3306, %int100_3307 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2957 = torch.aten.view %2950, %2956 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int26_3308 = torch.constant.int 26 %2958 = torch.aten.mul.int %731, %int26_3308 : !torch.int, !torch.int -> !torch.int %int2_3309 = torch.constant.int 2 %2959 = torch.aten.mul.int %2958, %int2_3309 : !torch.int, !torch.int -> !torch.int %int16_3310 = torch.constant.int 16 %int32_3311 = torch.constant.int 32 %int100_3312 = torch.constant.int 100 %2960 = torch.prim.ListConstruct %2959, %int16_3310, %int32_3311, %int100_3312 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2961 = torch.aten.view %2957, %2960 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,16,32,100],f32> %int0_3313 = torch.constant.int 0 %2962 = torch.aten.index_select %2961, %int0_3313, %2955 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_3314 = torch.constant.int 4 %int16_3315 = torch.constant.int 16 %int32_3316 = torch.constant.int 32 %int100_3317 = torch.constant.int 100 %2963 = torch.prim.ListConstruct %int4_3314, %655, %int16_3315, %int32_3316, %int100_3317 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2964 = torch.aten.view %2962, %2963 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_3318 = torch.constant.int 1 %2965 = torch.aten.size.int %2964, %int1_3318 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_3319 = 
torch.constant.int 16 %2966 = torch.aten.mul.int %2965, %int16_3319 : !torch.int, !torch.int -> !torch.int %int4_3320 = torch.constant.int 4 %int32_3321 = torch.constant.int 32 %int100_3322 = torch.constant.int 100 %2967 = torch.prim.ListConstruct %int4_3320, %2966, %int32_3321, %int100_3322 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2968 = torch.aten.view %2964, %2967 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_3323 = torch.constant.int 0 %int0_3324 = torch.constant.int 0 %int9223372036854775807_3325 = torch.constant.int 9223372036854775807 %int1_3326 = torch.constant.int 1 %2969 = torch.aten.slice.Tensor %2710, %int0_3323, %int0_3324, %int9223372036854775807_3325, %int1_3326 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int16_3327 = torch.constant.int 16 %2970 = torch.aten.mul.int %655, %int16_3327 : !torch.int, !torch.int -> !torch.int %int1_3328 = torch.constant.int 1 %int0_3329 = torch.constant.int 0 %int1_3330 = torch.constant.int 1 %2971 = torch.aten.slice.Tensor %2969, %int1_3328, %int0_3329, %2970, %int1_3330 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_3331 = torch.constant.bool false %2972 = torch.aten.copy %2971, %2968, %false_3331 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_3332 = torch.constant.int 0 %int0_3333 = torch.constant.int 0 %int9223372036854775807_3334 = torch.constant.int 9223372036854775807 %int1_3335 = torch.constant.int 1 %2973 = torch.aten.slice.Tensor %2710, %int0_3332, %int0_3333, %int9223372036854775807_3334, %int1_3335 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_3336 = torch.constant.int 1 %int0_3337 = torch.constant.int 0 %int1_3338 = 
torch.constant.int 1 %2974 = torch.aten.slice_scatter %2973, %2972, %int1_3336, %int0_3337, %2970, %int1_3338 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_3339 = torch.constant.int 0 %int0_3340 = torch.constant.int 0 %int9223372036854775807_3341 = torch.constant.int 9223372036854775807 %int1_3342 = torch.constant.int 1 %2975 = torch.aten.slice_scatter %2710, %2974, %int0_3339, %int0_3340, %int9223372036854775807_3341, %int1_3342 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_3343 = torch.constant.int 1 %int1_3344 = torch.constant.int 1 %2976 = torch.aten.add.Scalar %2952, %int1_3343, %int1_3344 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_3345 = torch.constant.int 4 %2977 = torch.aten.mul.int %int4_3345, %655 : !torch.int, !torch.int -> !torch.int %2978 = torch.prim.ListConstruct %2977 : (!torch.int) -> !torch.list %2979 = torch.aten.view %2976, %2978 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int0_3346 = torch.constant.int 0 %2980 = torch.aten.index_select %2961, %int0_3346, %2979 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_3347 = torch.constant.int 4 %int16_3348 = torch.constant.int 16 %int32_3349 = torch.constant.int 32 %int100_3350 = torch.constant.int 100 %2981 = torch.prim.ListConstruct %int4_3347, %655, %int16_3348, %int32_3349, %int100_3350 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2982 = torch.aten.view %2980, %2981 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_3351 = torch.constant.int 1 %2983 = torch.aten.size.int %2982, %int1_3351 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> 
!torch.int %int16_3352 = torch.constant.int 16 %2984 = torch.aten.mul.int %2983, %int16_3352 : !torch.int, !torch.int -> !torch.int %int4_3353 = torch.constant.int 4 %int32_3354 = torch.constant.int 32 %int100_3355 = torch.constant.int 100 %2985 = torch.prim.ListConstruct %int4_3353, %2984, %int32_3354, %int100_3355 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %2986 = torch.aten.view %2982, %2985 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_3356 = torch.constant.int 0 %int0_3357 = torch.constant.int 0 %int9223372036854775807_3358 = torch.constant.int 9223372036854775807 %int1_3359 = torch.constant.int 1 %2987 = torch.aten.slice.Tensor %2727, %int0_3356, %int0_3357, %int9223372036854775807_3358, %int1_3359 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_3360 = torch.constant.int 1 %int0_3361 = torch.constant.int 0 %int1_3362 = torch.constant.int 1 %2988 = torch.aten.slice.Tensor %2987, %int1_3360, %int0_3361, %2970, %int1_3362 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_3363 = torch.constant.bool false %2989 = torch.aten.copy %2988, %2986, %false_3363 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_3364 = torch.constant.int 0 %int0_3365 = torch.constant.int 0 %int9223372036854775807_3366 = torch.constant.int 9223372036854775807 %int1_3367 = torch.constant.int 1 %2990 = torch.aten.slice.Tensor %2727, %int0_3364, %int0_3365, %int9223372036854775807_3366, %int1_3367 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_3368 = torch.constant.int 1 %int0_3369 = torch.constant.int 0 %int1_3370 = torch.constant.int 1 %2991 = torch.aten.slice_scatter %2990, %2989, %int1_3368, %int0_3369, 
%2970, %int1_3370 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_3371 = torch.constant.int 0 %int0_3372 = torch.constant.int 0 %int9223372036854775807_3373 = torch.constant.int 9223372036854775807 %int1_3374 = torch.constant.int 1 %2992 = torch.aten.slice_scatter %2727, %2991, %int0_3371, %int0_3372, %int9223372036854775807_3373, %int1_3374 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_3375 = torch.constant.int 0 %int0_3376 = torch.constant.int 0 %int9223372036854775807_3377 = torch.constant.int 9223372036854775807 %int1_3378 = torch.constant.int 1 %2993 = torch.aten.slice.Tensor %671, %int0_3375, %int0_3376, %int9223372036854775807_3377, %int1_3378 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_3379 = torch.constant.int 1 %int0_3380 = torch.constant.int 0 %int1_3381 = torch.constant.int 1 %2994 = torch.aten.slice.Tensor %2993, %int1_3379, %int0_3380, %2970, %int1_3381 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int0_3382 = torch.constant.int 0 %int0_3383 = torch.constant.int 0 %int9223372036854775807_3384 = torch.constant.int 9223372036854775807 %int1_3385 = torch.constant.int 1 %2995 = torch.aten.slice.Tensor %673, %int0_3382, %int0_3383, %int9223372036854775807_3384, %int1_3385 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_3386 = torch.constant.int 1 %int0_3387 = torch.constant.int 0 %int1_3388 = torch.constant.int 1 %2996 = torch.aten.slice.Tensor %2995, %int1_3386, %int0_3387, %2970, %int1_3388 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> 
!torch.vtensor<[4,?,32,100],f32> %int1_3389 = torch.constant.int 1 %int2_3390 = torch.constant.int 2 %2997 = torch.aten.transpose.int %2833, %int1_3389, %int2_3390 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,1,100],f32> %int4_3391 = torch.constant.int 4 %int32_3392 = torch.constant.int 32 %int1_3393 = torch.constant.int 1 %int100_3394 = torch.constant.int 100 %2998 = torch.prim.ListConstruct %int4_3391, %int32_3392, %int1_3393, %int100_3394 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_3395 = torch.constant.bool false %2999 = torch.aten.expand %2997, %2998, %false_3395 : !torch.vtensor<[4,32,1,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,100],f32> %int128_3396 = torch.constant.int 128 %int1_3397 = torch.constant.int 1 %int100_3398 = torch.constant.int 100 %3000 = torch.prim.ListConstruct %int128_3396, %int1_3397, %int100_3398 : (!torch.int, !torch.int, !torch.int) -> !torch.list %3001 = torch.aten.view %2999, %3000 : !torch.vtensor<[4,32,1,100],f32>, !torch.list -> !torch.vtensor<[128,1,100],f32> %int0_3399 = torch.constant.int 0 %int0_3400 = torch.constant.int 0 %int9223372036854775807_3401 = torch.constant.int 9223372036854775807 %int1_3402 = torch.constant.int 1 %3002 = torch.aten.slice.Tensor %2975, %int0_3399, %int0_3400, %int9223372036854775807_3401, %int1_3402 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_3403 = torch.constant.int 1 %int0_3404 = torch.constant.int 0 %int1_3405 = torch.constant.int 1 %3003 = torch.aten.slice.Tensor %3002, %int1_3403, %int0_3404, %2970, %int1_3405 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_3406 = torch.constant.int 1 %int2_3407 = torch.constant.int 2 %3004 = torch.aten.transpose.int %3003, %int1_3406, %int2_3407 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> 
!torch.vtensor<[4,32,?,100],f32> %int2_3408 = torch.constant.int 2 %int3_3409 = torch.constant.int 3 %3005 = torch.aten.transpose.int %3004, %int2_3408, %int3_3409 : !torch.vtensor<[4,32,?,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int1_3410 = torch.constant.int 1 %3006 = torch.aten.size.int %2994, %int1_3410 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_3411 = torch.constant.int 4 %int32_3412 = torch.constant.int 32 %int100_3413 = torch.constant.int 100 %3007 = torch.prim.ListConstruct %int4_3411, %int32_3412, %int100_3413, %3006 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_3414 = torch.constant.bool false %3008 = torch.aten.expand %3005, %3007, %false_3414 : !torch.vtensor<[4,32,100,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,100,?],f32> %int0_3415 = torch.constant.int 0 %3009 = torch.aten.clone %3008, %int0_3415 : !torch.vtensor<[4,32,100,?],f32>, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int128_3416 = torch.constant.int 128 %int100_3417 = torch.constant.int 100 %3010 = torch.prim.ListConstruct %int128_3416, %int100_3417, %3006 : (!torch.int, !torch.int, !torch.int) -> !torch.list %3011 = torch.aten._unsafe_view %3009, %3010 : !torch.vtensor<[4,32,100,?],f32>, !torch.list -> !torch.vtensor<[128,100,?],f32> %3012 = torch.aten.bmm %3001, %3011 : !torch.vtensor<[128,1,100],f32>, !torch.vtensor<[128,100,?],f32> -> !torch.vtensor<[128,1,?],f32> %int4_3418 = torch.constant.int 4 %int32_3419 = torch.constant.int 32 %int1_3420 = torch.constant.int 1 %3013 = torch.prim.ListConstruct %int4_3418, %int32_3419, %int1_3420, %3006 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3014 = torch.aten.view %3012, %3013 : !torch.vtensor<[128,1,?],f32>, !torch.list -> !torch.vtensor<[4,32,1,?],f32> %float1.000000e01_3421 = torch.constant.float 1.000000e+01 %3015 = torch.aten.div.Scalar %3014, %float1.000000e01_3421 : !torch.vtensor<[4,32,1,?],f32>, !torch.float -> 
!torch.vtensor<[4,32,1,?],f32> %int1_3422 = torch.constant.int 1 %3016 = torch.aten.add.Tensor %3015, %895, %int1_3422 : !torch.vtensor<[4,32,1,?],f32>, !torch.vtensor<[4,1,1,?],f32>, !torch.int -> !torch.vtensor<[4,32,1,?],f32> %int-1_3423 = torch.constant.int -1 %false_3424 = torch.constant.bool false %3017 = torch.aten._softmax %3016, %int-1_3423, %false_3424 : !torch.vtensor<[4,32,1,?],f32>, !torch.int, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int4_3425 = torch.constant.int 4 %int32_3426 = torch.constant.int 32 %int1_3427 = torch.constant.int 1 %3018 = torch.prim.ListConstruct %int4_3425, %int32_3426, %int1_3427, %3006 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_3428 = torch.constant.bool false %3019 = torch.aten.expand %3017, %3018, %false_3428 : !torch.vtensor<[4,32,1,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int128_3429 = torch.constant.int 128 %int1_3430 = torch.constant.int 1 %3020 = torch.prim.ListConstruct %int128_3429, %int1_3430, %3006 : (!torch.int, !torch.int, !torch.int) -> !torch.list %3021 = torch.aten.view %3019, %3020 : !torch.vtensor<[4,32,1,?],f32>, !torch.list -> !torch.vtensor<[128,1,?],f32> %int0_3431 = torch.constant.int 0 %int0_3432 = torch.constant.int 0 %int9223372036854775807_3433 = torch.constant.int 9223372036854775807 %int1_3434 = torch.constant.int 1 %3022 = torch.aten.slice.Tensor %2992, %int0_3431, %int0_3432, %int9223372036854775807_3433, %int1_3434 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_3435 = torch.constant.int 1 %int0_3436 = torch.constant.int 0 %int1_3437 = torch.constant.int 1 %3023 = torch.aten.slice.Tensor %3022, %int1_3435, %int0_3436, %2970, %int1_3437 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_3438 = torch.constant.int 1 %int2_3439 = torch.constant.int 2 %3024 = 
torch.aten.transpose.int %3023, %int1_3438, %int2_3439 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int1_3440 = torch.constant.int 1 %3025 = torch.aten.size.int %2996, %int1_3440 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_3441 = torch.constant.int 4 %int32_3442 = torch.constant.int 32 %int100_3443 = torch.constant.int 100 %3026 = torch.prim.ListConstruct %int4_3441, %int32_3442, %3025, %int100_3443 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_3444 = torch.constant.bool false %3027 = torch.aten.expand %3024, %3026, %false_3444 : !torch.vtensor<[4,32,?,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,?,100],f32> %int0_3445 = torch.constant.int 0 %3028 = torch.aten.clone %3027, %int0_3445 : !torch.vtensor<[4,32,?,100],f32>, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int128_3446 = torch.constant.int 128 %int100_3447 = torch.constant.int 100 %3029 = torch.prim.ListConstruct %int128_3446, %3025, %int100_3447 : (!torch.int, !torch.int, !torch.int) -> !torch.list %3030 = torch.aten._unsafe_view %3028, %3029 : !torch.vtensor<[4,32,?,100],f32>, !torch.list -> !torch.vtensor<[128,?,100],f32> %3031 = torch.aten.bmm %3021, %3030 : !torch.vtensor<[128,1,?],f32>, !torch.vtensor<[128,?,100],f32> -> !torch.vtensor<[128,1,100],f32> %int4_3448 = torch.constant.int 4 %int32_3449 = torch.constant.int 32 %int1_3450 = torch.constant.int 1 %int100_3451 = torch.constant.int 100 %3032 = torch.prim.ListConstruct %int4_3448, %int32_3449, %int1_3450, %int100_3451 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3033 = torch.aten.view %3031, %3032 : !torch.vtensor<[128,1,100],f32>, !torch.list -> !torch.vtensor<[4,32,1,100],f32> %int1_3452 = torch.constant.int 1 %int2_3453 = torch.constant.int 2 %3034 = torch.aten.transpose.int %3033, %int1_3452, %int2_3453 : !torch.vtensor<[4,32,1,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,1,32,100],f32> 
%int4_3454 = torch.constant.int 4 %int1_3455 = torch.constant.int 1 %int-1_3456 = torch.constant.int -1 %3035 = torch.prim.ListConstruct %int4_3454, %int1_3455, %int-1_3456 : (!torch.int, !torch.int, !torch.int) -> !torch.list %3036 = torch.aten.view %3034, %3035 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,3200],f32> %3037 = torch_c.to_builtin_tensor %3036 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_3457 = tensor.cast %3037 : tensor<4x1x3200xf32> to tensor %3038 = torch_c.to_builtin_tensor %78 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %3039 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_3457, %3038) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_3458 = tensor.cast %3039 : tensor to tensor<4x1x3200xf32> %3040 = torch_c.from_builtin_tensor %cast_3458 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int1_3459 = torch.constant.int 1 %3041 = torch.aten.add.Tensor %2798, %3040, %int1_3459 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_3460 = torch.constant.int 2 %3042 = torch.aten.pow.Tensor_Scalar %3041, %int2_3460 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_3461 = torch.constant.int -1 %3043 = torch.prim.ListConstruct %int-1_3461 : (!torch.int) -> !torch.list %true_3462 = torch.constant.bool true %none_3463 = torch.constant.none %3044 = torch.aten.mean.dim %3042, %3043, %true_3462, %none_3463 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_3464 = torch.constant.float 9.9999999747524271E-7 %int1_3465 = torch.constant.int 1 %3045 = torch.aten.add.Scalar %3044, %float9.999990e-07_3464, %int1_3465 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %3046 = torch.aten.rsqrt %3045 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %3047 = torch.aten.mul.Tensor 
%3041, %3046 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %3048 = torch.aten.mul.Tensor %3047, %79 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %3049 = torch_c.to_builtin_tensor %3048 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_3466 = tensor.cast %3049 : tensor<4x1x3200xf32> to tensor %3050 = torch_c.to_builtin_tensor %80 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %3051 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_3466, %3050) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_3467 = tensor.cast %3051 : tensor to tensor<4x1x8640xf32> %3052 = torch_c.from_builtin_tensor %cast_3467 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %3053 = torch.aten.silu %3052 : !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32> %3054 = torch_c.to_builtin_tensor %3048 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_3468 = tensor.cast %3054 : tensor<4x1x3200xf32> to tensor %3055 = torch_c.to_builtin_tensor %81 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %3056 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_3468, %3055) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_3469 = tensor.cast %3056 : tensor to tensor<4x1x8640xf32> %3057 = torch_c.from_builtin_tensor %cast_3469 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %3058 = torch.aten.mul.Tensor %3053, %3057 : !torch.vtensor<[4,1,8640],f32>, !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32> %3059 = torch_c.to_builtin_tensor %3058 : !torch.vtensor<[4,1,8640],f32> -> tensor<4x1x8640xf32> %cast_3470 = tensor.cast %3059 : tensor<4x1x8640xf32> to tensor %3060 = torch_c.to_builtin_tensor %82 : !torch.vtensor<[3200,8640],f16> -> tensor<3200x8640xf16> %3061 = util.call @sharktank_mmtfp_3d_3200_8640_f32f16f32(%cast_3470, %3060) : (tensor, tensor<3200x8640xf16>) -> tensor %cast_3471 = tensor.cast %3061 : tensor to 
tensor<4x1x3200xf32> %3062 = torch_c.from_builtin_tensor %cast_3471 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int1_3472 = torch.constant.int 1 %3063 = torch.aten.add.Tensor %3041, %3062, %int1_3472 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_3473 = torch.constant.int 2 %3064 = torch.aten.pow.Tensor_Scalar %3063, %int2_3473 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_3474 = torch.constant.int -1 %3065 = torch.prim.ListConstruct %int-1_3474 : (!torch.int) -> !torch.list %true_3475 = torch.constant.bool true %none_3476 = torch.constant.none %3066 = torch.aten.mean.dim %3064, %3065, %true_3475, %none_3476 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_3477 = torch.constant.float 9.9999999747524271E-7 %int1_3478 = torch.constant.int 1 %3067 = torch.aten.add.Scalar %3066, %float9.999990e-07_3477, %int1_3478 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %3068 = torch.aten.rsqrt %3067 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %3069 = torch.aten.mul.Tensor %3063, %3068 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %3070 = torch.aten.mul.Tensor %3069, %83 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %3071 = torch_c.to_builtin_tensor %3070 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_3479 = tensor.cast %3071 : tensor<4x1x3200xf32> to tensor %3072 = torch_c.to_builtin_tensor %84 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %3073 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_3479, %3072) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_3480 = tensor.cast %3073 : tensor to tensor<4x1x3200xf32> %3074 = torch_c.from_builtin_tensor %cast_3480 : tensor<4x1x3200xf32> -> 
!torch.vtensor<[4,1,3200],f32> %3075 = torch_c.to_builtin_tensor %3070 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_3481 = tensor.cast %3075 : tensor<4x1x3200xf32> to tensor %3076 = torch_c.to_builtin_tensor %85 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %3077 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_3481, %3076) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_3482 = tensor.cast %3077 : tensor to tensor<4x1x3200xf32> %3078 = torch_c.from_builtin_tensor %cast_3482 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %3079 = torch_c.to_builtin_tensor %3070 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_3483 = tensor.cast %3079 : tensor<4x1x3200xf32> to tensor %3080 = torch_c.to_builtin_tensor %86 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %3081 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_3483, %3080) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_3484 = tensor.cast %3081 : tensor to tensor<4x1x3200xf32> %3082 = torch_c.from_builtin_tensor %cast_3484 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int4_3485 = torch.constant.int 4 %int1_3486 = torch.constant.int 1 %int32_3487 = torch.constant.int 32 %int100_3488 = torch.constant.int 100 %3083 = torch.prim.ListConstruct %int4_3485, %int1_3486, %int32_3487, %int100_3488 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3084 = torch.aten.view %3074, %3083 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_3489 = torch.constant.int 4 %int1_3490 = torch.constant.int 1 %int32_3491 = torch.constant.int 32 %int100_3492 = torch.constant.int 100 %3085 = torch.prim.ListConstruct %int4_3489, %int1_3490, %int32_3491, %int100_3492 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3086 = torch.aten.view %3078, %3085 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_3493 = torch.constant.int 4 %int1_3494 = 
torch.constant.int 1 %int32_3495 = torch.constant.int 32 %int100_3496 = torch.constant.int 100 %3087 = torch.prim.ListConstruct %int4_3493, %int1_3494, %int32_3495, %int100_3496 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3088 = torch.aten.view %3082, %3087 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_3497 = torch.constant.int 4 %int1_3498 = torch.constant.int 1 %int32_3499 = torch.constant.int 32 %int-1_3500 = torch.constant.int -1 %int2_3501 = torch.constant.int 2 %3089 = torch.prim.ListConstruct %int4_3497, %int1_3498, %int32_3499, %int-1_3500, %int2_3501 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3090 = torch.aten.view %3084, %3089 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %3091 = torch.aten.view_as_complex %3090 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %int4_3502 = torch.constant.int 4 %int1_3503 = torch.constant.int 1 %int32_3504 = torch.constant.int 32 %int-1_3505 = torch.constant.int -1 %int2_3506 = torch.constant.int 2 %3092 = torch.prim.ListConstruct %int4_3502, %int1_3503, %int32_3504, %int-1_3505, %int2_3506 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3093 = torch.aten.view %3086, %3092 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %3094 = torch.aten.view_as_complex %3093 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %3095 = torch.aten.mul.Tensor %3091, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %3096 = torch.aten.view_as_real %3095 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_3507 = torch.constant.int 4 %int1_3508 = torch.constant.int 1 %int32_3509 = torch.constant.int 32 %int100_3510 = torch.constant.int 100 %3097 = torch.prim.ListConstruct %int4_3507, %int1_3508, 
%int32_3509, %int100_3510 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3098 = torch.aten.view %3096, %3097 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %3099 = torch.aten.mul.Tensor %3094, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %3100 = torch.aten.view_as_real %3099 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_3511 = torch.constant.int 4 %int1_3512 = torch.constant.int 1 %int32_3513 = torch.constant.int 32 %int100_3514 = torch.constant.int 100 %3101 = torch.prim.ListConstruct %int4_3511, %int1_3512, %int32_3513, %int100_3514 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3102 = torch.aten.view %3100, %3101 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int1_3515 = torch.constant.int 1 %int1_3516 = torch.constant.int 1 %3103 = torch.aten.add.Scalar %arg2, %int1_3515, %int1_3516 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[4],si64> %int0_3517 = torch.constant.int 0 %int0_3518 = torch.constant.int 0 %3104 = torch.aten.select.int %3103, %int0_3517, %int0_3518 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_3519 = torch.constant.int 0 %int0_3520 = torch.constant.int 0 %3105 = torch.aten.select.int %arg3, %int0_3519, %int0_3520 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_3521 = torch.constant.int 0 %int0_3522 = torch.constant.int 0 %int9223372036854775807_3523 = torch.constant.int 9223372036854775807 %int1_3524 = torch.constant.int 1 %3106 = torch.aten.slice.Tensor %3105, %int0_3521, %int0_3522, %int9223372036854775807_3523, %int1_3524 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_3525 = torch.constant.int 16 %3107 = torch.aten.floor_divide.Scalar %3104, %int16_3525 : 
!torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_3526 = torch.constant.int 0 %3108 = torch.aten.index_select %3106, %int0_3526, %3107 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_3527 = torch.constant.int 16 %3109 = torch.aten.remainder.Scalar %3104, %int16_3527 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_3528 = torch.constant.none %3110 = torch.aten.clone %382, %none_3528 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_3529 = torch.constant.none %3111 = torch.aten.clone %383, %none_3529 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_3530 = torch.constant.int 0 %3112 = torch.aten.unsqueeze %3109, %int0_3530 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_3531 = torch.constant.int 0 %int0_3532 = torch.constant.int 0 %3113 = torch.aten.select.int %3102, %int0_3531, %int0_3532 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_3533 = torch.constant.int 0 %int0_3534 = torch.constant.int 0 %3114 = torch.aten.select.int %3113, %int0_3533, %int0_3534 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %int-1_3535 = torch.constant.int -1 %int26_3536 = torch.constant.int 26 %int2_3537 = torch.constant.int 2 %int16_3538 = torch.constant.int 16 %int32_3539 = torch.constant.int 32 %int100_3540 = torch.constant.int 100 %3115 = torch.prim.ListConstruct %int-1_3535, %int26_3536, %int2_3537, %int16_3538, %int32_3539, %int100_3540 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3116 = torch.aten.view %2950, %3115 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %3117 = torch.prim.ListConstruct %3108, %3110, %3111, %3112 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> 
%false_3541 = torch.constant.bool false %3118 = torch.aten.index_put %3116, %3117, %3114, %false_3541 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_3542 = torch.constant.int 2662400 %3119 = torch.prim.ListConstruct %731, %int2662400_3542 : (!torch.int, !torch.int) -> !torch.list %3120 = torch.aten.view %3118, %3119 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_3543 = torch.constant.int -1 %int26_3544 = torch.constant.int 26 %int2_3545 = torch.constant.int 2 %int16_3546 = torch.constant.int 16 %int32_3547 = torch.constant.int 32 %int100_3548 = torch.constant.int 100 %3121 = torch.prim.ListConstruct %int-1_3543, %int26_3544, %int2_3545, %int16_3546, %int32_3547, %int100_3548 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3122 = torch.aten.view %3120, %3121 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_3549 = torch.constant.none %3123 = torch.aten.clone %384, %none_3549 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_3550 = torch.constant.none %3124 = torch.aten.clone %385, %none_3550 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_3551 = torch.constant.int 0 %3125 = torch.aten.unsqueeze %3109, %int0_3551 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_3552 = torch.constant.int 0 %int0_3553 = torch.constant.int 0 %3126 = torch.aten.select.int %3088, %int0_3552, %int0_3553 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_3554 = torch.constant.int 0 %int0_3555 = torch.constant.int 0 %3127 = torch.aten.select.int %3126, %int0_3554, %int0_3555 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %3128 = torch.prim.ListConstruct %3108, %3123, %3124, %3125 : 
(!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_3556 = torch.constant.bool false %3129 = torch.aten.index_put %3122, %3128, %3127, %false_3556 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_3557 = torch.constant.int 2662400 %3130 = torch.prim.ListConstruct %731, %int2662400_3557 : (!torch.int, !torch.int) -> !torch.list %3131 = torch.aten.view %3129, %3130 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_3558 = torch.constant.int -1 %int26_3559 = torch.constant.int 26 %int2_3560 = torch.constant.int 2 %int16_3561 = torch.constant.int 16 %int32_3562 = torch.constant.int 32 %int100_3563 = torch.constant.int 100 %3132 = torch.prim.ListConstruct %int-1_3558, %int26_3559, %int2_3560, %int16_3561, %int32_3562, %int100_3563 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3133 = torch.aten.view %3131, %3132 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_3564 = torch.constant.int 0 %int1_3565 = torch.constant.int 1 %3134 = torch.aten.select.int %3103, %int0_3564, %int1_3565 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_3566 = torch.constant.int 0 %int1_3567 = torch.constant.int 1 %3135 = torch.aten.select.int %arg3, %int0_3566, %int1_3567 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_3568 = torch.constant.int 0 %int0_3569 = torch.constant.int 0 %int9223372036854775807_3570 = torch.constant.int 9223372036854775807 %int1_3571 = torch.constant.int 1 %3136 = torch.aten.slice.Tensor %3135, %int0_3568, %int0_3569, %int9223372036854775807_3570, %int1_3571 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_3572 = 
torch.constant.int 16 %3137 = torch.aten.floor_divide.Scalar %3134, %int16_3572 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_3573 = torch.constant.int 0 %3138 = torch.aten.index_select %3136, %int0_3573, %3137 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_3574 = torch.constant.int 16 %3139 = torch.aten.remainder.Scalar %3134, %int16_3574 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_3575 = torch.constant.none %3140 = torch.aten.clone %386, %none_3575 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_3576 = torch.constant.none %3141 = torch.aten.clone %387, %none_3576 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_3577 = torch.constant.int 0 %3142 = torch.aten.unsqueeze %3139, %int0_3577 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_3578 = torch.constant.int 0 %int1_3579 = torch.constant.int 1 %3143 = torch.aten.select.int %3102, %int0_3578, %int1_3579 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_3580 = torch.constant.int 0 %int0_3581 = torch.constant.int 0 %3144 = torch.aten.select.int %3143, %int0_3580, %int0_3581 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %3145 = torch.prim.ListConstruct %3138, %3140, %3141, %3142 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_3582 = torch.constant.bool false %3146 = torch.aten.index_put %3133, %3145, %3144, %false_3582 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_3583 = torch.constant.int 2662400 %3147 = torch.prim.ListConstruct %731, %int2662400_3583 : (!torch.int, !torch.int) -> !torch.list %3148 = torch.aten.view %3146, %3147 : 
!torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_3584 = torch.constant.int -1 %int26_3585 = torch.constant.int 26 %int2_3586 = torch.constant.int 2 %int16_3587 = torch.constant.int 16 %int32_3588 = torch.constant.int 32 %int100_3589 = torch.constant.int 100 %3149 = torch.prim.ListConstruct %int-1_3584, %int26_3585, %int2_3586, %int16_3587, %int32_3588, %int100_3589 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3150 = torch.aten.view %3148, %3149 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_3590 = torch.constant.none %3151 = torch.aten.clone %388, %none_3590 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_3591 = torch.constant.none %3152 = torch.aten.clone %389, %none_3591 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_3592 = torch.constant.int 0 %3153 = torch.aten.unsqueeze %3139, %int0_3592 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_3593 = torch.constant.int 0 %int1_3594 = torch.constant.int 1 %3154 = torch.aten.select.int %3088, %int0_3593, %int1_3594 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_3595 = torch.constant.int 0 %int0_3596 = torch.constant.int 0 %3155 = torch.aten.select.int %3154, %int0_3595, %int0_3596 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %3156 = torch.prim.ListConstruct %3138, %3151, %3152, %3153 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_3597 = torch.constant.bool false %3157 = torch.aten.index_put %3150, %3156, %3155, %false_3597 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_3598 = torch.constant.int 2662400 %3158 = 
torch.prim.ListConstruct %731, %int2662400_3598 : (!torch.int, !torch.int) -> !torch.list %3159 = torch.aten.view %3157, %3158 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_3599 = torch.constant.int -1 %int26_3600 = torch.constant.int 26 %int2_3601 = torch.constant.int 2 %int16_3602 = torch.constant.int 16 %int32_3603 = torch.constant.int 32 %int100_3604 = torch.constant.int 100 %3160 = torch.prim.ListConstruct %int-1_3599, %int26_3600, %int2_3601, %int16_3602, %int32_3603, %int100_3604 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3161 = torch.aten.view %3159, %3160 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_3605 = torch.constant.int 0 %int2_3606 = torch.constant.int 2 %3162 = torch.aten.select.int %3103, %int0_3605, %int2_3606 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_3607 = torch.constant.int 0 %int2_3608 = torch.constant.int 2 %3163 = torch.aten.select.int %arg3, %int0_3607, %int2_3608 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_3609 = torch.constant.int 0 %int0_3610 = torch.constant.int 0 %int9223372036854775807_3611 = torch.constant.int 9223372036854775807 %int1_3612 = torch.constant.int 1 %3164 = torch.aten.slice.Tensor %3163, %int0_3609, %int0_3610, %int9223372036854775807_3611, %int1_3612 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_3613 = torch.constant.int 16 %3165 = torch.aten.floor_divide.Scalar %3162, %int16_3613 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_3614 = torch.constant.int 0 %3166 = torch.aten.index_select %3164, %int0_3614, %3165 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_3615 = torch.constant.int 16 %3167 = torch.aten.remainder.Scalar %3162, %int16_3615 : 
!torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_3616 = torch.constant.none %3168 = torch.aten.clone %390, %none_3616 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_3617 = torch.constant.none %3169 = torch.aten.clone %391, %none_3617 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_3618 = torch.constant.int 0 %3170 = torch.aten.unsqueeze %3167, %int0_3618 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_3619 = torch.constant.int 0 %int2_3620 = torch.constant.int 2 %3171 = torch.aten.select.int %3102, %int0_3619, %int2_3620 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_3621 = torch.constant.int 0 %int0_3622 = torch.constant.int 0 %3172 = torch.aten.select.int %3171, %int0_3621, %int0_3622 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %3173 = torch.prim.ListConstruct %3166, %3168, %3169, %3170 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_3623 = torch.constant.bool false %3174 = torch.aten.index_put %3161, %3173, %3172, %false_3623 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_3624 = torch.constant.int 2662400 %3175 = torch.prim.ListConstruct %731, %int2662400_3624 : (!torch.int, !torch.int) -> !torch.list %3176 = torch.aten.view %3174, %3175 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_3625 = torch.constant.int -1 %int26_3626 = torch.constant.int 26 %int2_3627 = torch.constant.int 2 %int16_3628 = torch.constant.int 16 %int32_3629 = torch.constant.int 32 %int100_3630 = torch.constant.int 100 %3177 = torch.prim.ListConstruct %int-1_3625, %int26_3626, %int2_3627, %int16_3628, %int32_3629, %int100_3630 : (!torch.int, !torch.int, !torch.int, 
!torch.int, !torch.int, !torch.int) -> !torch.list %3178 = torch.aten.view %3176, %3177 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_3631 = torch.constant.none %3179 = torch.aten.clone %392, %none_3631 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_3632 = torch.constant.none %3180 = torch.aten.clone %393, %none_3632 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_3633 = torch.constant.int 0 %3181 = torch.aten.unsqueeze %3167, %int0_3633 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_3634 = torch.constant.int 0 %int2_3635 = torch.constant.int 2 %3182 = torch.aten.select.int %3088, %int0_3634, %int2_3635 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_3636 = torch.constant.int 0 %int0_3637 = torch.constant.int 0 %3183 = torch.aten.select.int %3182, %int0_3636, %int0_3637 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %3184 = torch.prim.ListConstruct %3166, %3179, %3180, %3181 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_3638 = torch.constant.bool false %3185 = torch.aten.index_put %3178, %3184, %3183, %false_3638 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_3639 = torch.constant.int 2662400 %3186 = torch.prim.ListConstruct %731, %int2662400_3639 : (!torch.int, !torch.int) -> !torch.list %3187 = torch.aten.view %3185, %3186 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_3640 = torch.constant.int -1 %int26_3641 = torch.constant.int 26 %int2_3642 = torch.constant.int 2 %int16_3643 = torch.constant.int 16 %int32_3644 = torch.constant.int 32 %int100_3645 = torch.constant.int 100 %3188 = torch.prim.ListConstruct 
%int-1_3640, %int26_3641, %int2_3642, %int16_3643, %int32_3644, %int100_3645 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3189 = torch.aten.view %3187, %3188 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_3646 = torch.constant.int 0 %int3_3647 = torch.constant.int 3 %3190 = torch.aten.select.int %3103, %int0_3646, %int3_3647 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_3648 = torch.constant.int 0 %int3_3649 = torch.constant.int 3 %3191 = torch.aten.select.int %arg3, %int0_3648, %int3_3649 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_3650 = torch.constant.int 0 %int0_3651 = torch.constant.int 0 %int9223372036854775807_3652 = torch.constant.int 9223372036854775807 %int1_3653 = torch.constant.int 1 %3192 = torch.aten.slice.Tensor %3191, %int0_3650, %int0_3651, %int9223372036854775807_3652, %int1_3653 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_3654 = torch.constant.int 16 %3193 = torch.aten.floor_divide.Scalar %3190, %int16_3654 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_3655 = torch.constant.int 0 %3194 = torch.aten.index_select %3192, %int0_3655, %3193 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_3656 = torch.constant.int 16 %3195 = torch.aten.remainder.Scalar %3190, %int16_3656 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_3657 = torch.constant.none %3196 = torch.aten.clone %394, %none_3657 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_3658 = torch.constant.none %3197 = torch.aten.clone %395, %none_3658 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_3659 = torch.constant.int 0 %3198 = torch.aten.unsqueeze %3195, %int0_3659 : !torch.vtensor<[],si64>, !torch.int -> 
!torch.vtensor<[1],si64> %int0_3660 = torch.constant.int 0 %int3_3661 = torch.constant.int 3 %3199 = torch.aten.select.int %3102, %int0_3660, %int3_3661 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_3662 = torch.constant.int 0 %int0_3663 = torch.constant.int 0 %3200 = torch.aten.select.int %3199, %int0_3662, %int0_3663 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %3201 = torch.prim.ListConstruct %3194, %3196, %3197, %3198 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_3664 = torch.constant.bool false %3202 = torch.aten.index_put %3189, %3201, %3200, %false_3664 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_3665 = torch.constant.int 2662400 %3203 = torch.prim.ListConstruct %731, %int2662400_3665 : (!torch.int, !torch.int) -> !torch.list %3204 = torch.aten.view %3202, %3203 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_3666 = torch.constant.int -1 %int26_3667 = torch.constant.int 26 %int2_3668 = torch.constant.int 2 %int16_3669 = torch.constant.int 16 %int32_3670 = torch.constant.int 32 %int100_3671 = torch.constant.int 100 %3205 = torch.prim.ListConstruct %int-1_3666, %int26_3667, %int2_3668, %int16_3669, %int32_3670, %int100_3671 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3206 = torch.aten.view %3204, %3205 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_3672 = torch.constant.none %3207 = torch.aten.clone %396, %none_3672 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_3673 = torch.constant.none %3208 = torch.aten.clone %397, %none_3673 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_3674 = 
torch.constant.int 0 %3209 = torch.aten.unsqueeze %3195, %int0_3674 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_3675 = torch.constant.int 0 %int3_3676 = torch.constant.int 3 %3210 = torch.aten.select.int %3088, %int0_3675, %int3_3676 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_3677 = torch.constant.int 0 %int0_3678 = torch.constant.int 0 %3211 = torch.aten.select.int %3210, %int0_3677, %int0_3678 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %3212 = torch.prim.ListConstruct %3194, %3207, %3208, %3209 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_3679 = torch.constant.bool false %3213 = torch.aten.index_put %3206, %3212, %3211, %false_3679 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_3680 = torch.constant.int 2662400 %3214 = torch.prim.ListConstruct %731, %int2662400_3680 : (!torch.int, !torch.int) -> !torch.list %3215 = torch.aten.view %3213, %3214 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int52_3681 = torch.constant.int 52 %3216 = torch.aten.mul.Scalar %arg3, %int52_3681 : !torch.vtensor<[4,?],si64>, !torch.int -> !torch.vtensor<[4,?],si64> %int18 = torch.constant.int 18 %int1_3682 = torch.constant.int 1 %3217 = torch.aten.add.Scalar %3216, %int18, %int1_3682 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_3683 = torch.constant.int 4 %3218 = torch.aten.mul.int %int4_3683, %655 : !torch.int, !torch.int -> !torch.int %3219 = torch.prim.ListConstruct %3218 : (!torch.int) -> !torch.list %3220 = torch.aten.view %3217, %3219 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int-1_3684 = torch.constant.int -1 %int26_3685 = torch.constant.int 26 
%int2_3686 = torch.constant.int 2 %int16_3687 = torch.constant.int 16 %int32_3688 = torch.constant.int 32 %int100_3689 = torch.constant.int 100 %3221 = torch.prim.ListConstruct %int-1_3684, %int26_3685, %int2_3686, %int16_3687, %int32_3688, %int100_3689 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3222 = torch.aten.view %3215, %3221 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int26_3690 = torch.constant.int 26 %3223 = torch.aten.mul.int %731, %int26_3690 : !torch.int, !torch.int -> !torch.int %int2_3691 = torch.constant.int 2 %3224 = torch.aten.mul.int %3223, %int2_3691 : !torch.int, !torch.int -> !torch.int %int16_3692 = torch.constant.int 16 %int32_3693 = torch.constant.int 32 %int100_3694 = torch.constant.int 100 %3225 = torch.prim.ListConstruct %3224, %int16_3692, %int32_3693, %int100_3694 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3226 = torch.aten.view %3222, %3225 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,16,32,100],f32> %int0_3695 = torch.constant.int 0 %3227 = torch.aten.index_select %3226, %int0_3695, %3220 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_3696 = torch.constant.int 4 %int16_3697 = torch.constant.int 16 %int32_3698 = torch.constant.int 32 %int100_3699 = torch.constant.int 100 %3228 = torch.prim.ListConstruct %int4_3696, %655, %int16_3697, %int32_3698, %int100_3699 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3229 = torch.aten.view %3227, %3228 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_3700 = torch.constant.int 1 %3230 = torch.aten.size.int %3229, %int1_3700 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_3701 = torch.constant.int 16 %3231 = torch.aten.mul.int %3230, %int16_3701 : !torch.int, !torch.int -> !torch.int 
%int4_3702 = torch.constant.int 4 %int32_3703 = torch.constant.int 32 %int100_3704 = torch.constant.int 100 %3232 = torch.prim.ListConstruct %int4_3702, %3231, %int32_3703, %int100_3704 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3233 = torch.aten.view %3229, %3232 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_3705 = torch.constant.int 0 %int0_3706 = torch.constant.int 0 %int9223372036854775807_3707 = torch.constant.int 9223372036854775807 %int1_3708 = torch.constant.int 1 %3234 = torch.aten.slice.Tensor %2975, %int0_3705, %int0_3706, %int9223372036854775807_3707, %int1_3708 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int16_3709 = torch.constant.int 16 %3235 = torch.aten.mul.int %655, %int16_3709 : !torch.int, !torch.int -> !torch.int %int1_3710 = torch.constant.int 1 %int0_3711 = torch.constant.int 0 %int1_3712 = torch.constant.int 1 %3236 = torch.aten.slice.Tensor %3234, %int1_3710, %int0_3711, %3235, %int1_3712 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_3713 = torch.constant.bool false %3237 = torch.aten.copy %3236, %3233, %false_3713 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_3714 = torch.constant.int 0 %int0_3715 = torch.constant.int 0 %int9223372036854775807_3716 = torch.constant.int 9223372036854775807 %int1_3717 = torch.constant.int 1 %3238 = torch.aten.slice.Tensor %2975, %int0_3714, %int0_3715, %int9223372036854775807_3716, %int1_3717 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_3718 = torch.constant.int 1 %int0_3719 = torch.constant.int 0 %int1_3720 = torch.constant.int 1 %3239 = torch.aten.slice_scatter %3238, %3237, %int1_3718, %int0_3719, %3235, 
%int1_3720 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_3721 = torch.constant.int 0 %int0_3722 = torch.constant.int 0 %int9223372036854775807_3723 = torch.constant.int 9223372036854775807 %int1_3724 = torch.constant.int 1 %3240 = torch.aten.slice_scatter %2975, %3239, %int0_3721, %int0_3722, %int9223372036854775807_3723, %int1_3724 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_3725 = torch.constant.int 1 %int1_3726 = torch.constant.int 1 %3241 = torch.aten.add.Scalar %3217, %int1_3725, %int1_3726 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_3727 = torch.constant.int 4 %3242 = torch.aten.mul.int %int4_3727, %655 : !torch.int, !torch.int -> !torch.int %3243 = torch.prim.ListConstruct %3242 : (!torch.int) -> !torch.list %3244 = torch.aten.view %3241, %3243 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int0_3728 = torch.constant.int 0 %3245 = torch.aten.index_select %3226, %int0_3728, %3244 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_3729 = torch.constant.int 4 %int16_3730 = torch.constant.int 16 %int32_3731 = torch.constant.int 32 %int100_3732 = torch.constant.int 100 %3246 = torch.prim.ListConstruct %int4_3729, %655, %int16_3730, %int32_3731, %int100_3732 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3247 = torch.aten.view %3245, %3246 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_3733 = torch.constant.int 1 %3248 = torch.aten.size.int %3247, %int1_3733 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_3734 = torch.constant.int 16 %3249 = torch.aten.mul.int %3248, %int16_3734 : !torch.int, 
!torch.int -> !torch.int %int4_3735 = torch.constant.int 4 %int32_3736 = torch.constant.int 32 %int100_3737 = torch.constant.int 100 %3250 = torch.prim.ListConstruct %int4_3735, %3249, %int32_3736, %int100_3737 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3251 = torch.aten.view %3247, %3250 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_3738 = torch.constant.int 0 %int0_3739 = torch.constant.int 0 %int9223372036854775807_3740 = torch.constant.int 9223372036854775807 %int1_3741 = torch.constant.int 1 %3252 = torch.aten.slice.Tensor %2992, %int0_3738, %int0_3739, %int9223372036854775807_3740, %int1_3741 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_3742 = torch.constant.int 1 %int0_3743 = torch.constant.int 0 %int1_3744 = torch.constant.int 1 %3253 = torch.aten.slice.Tensor %3252, %int1_3742, %int0_3743, %3235, %int1_3744 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_3745 = torch.constant.bool false %3254 = torch.aten.copy %3253, %3251, %false_3745 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_3746 = torch.constant.int 0 %int0_3747 = torch.constant.int 0 %int9223372036854775807_3748 = torch.constant.int 9223372036854775807 %int1_3749 = torch.constant.int 1 %3255 = torch.aten.slice.Tensor %2992, %int0_3746, %int0_3747, %int9223372036854775807_3748, %int1_3749 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_3750 = torch.constant.int 1 %int0_3751 = torch.constant.int 0 %int1_3752 = torch.constant.int 1 %3256 = torch.aten.slice_scatter %3255, %3254, %int1_3750, %int0_3751, %3235, %int1_3752 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, 
!torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_3753 = torch.constant.int 0 %int0_3754 = torch.constant.int 0 %int9223372036854775807_3755 = torch.constant.int 9223372036854775807 %int1_3756 = torch.constant.int 1 %3257 = torch.aten.slice_scatter %2992, %3256, %int0_3753, %int0_3754, %int9223372036854775807_3755, %int1_3756 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_3757 = torch.constant.int 0 %int0_3758 = torch.constant.int 0 %int9223372036854775807_3759 = torch.constant.int 9223372036854775807 %int1_3760 = torch.constant.int 1 %3258 = torch.aten.slice.Tensor %671, %int0_3757, %int0_3758, %int9223372036854775807_3759, %int1_3760 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_3761 = torch.constant.int 1 %int0_3762 = torch.constant.int 0 %int1_3763 = torch.constant.int 1 %3259 = torch.aten.slice.Tensor %3258, %int1_3761, %int0_3762, %3235, %int1_3763 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int0_3764 = torch.constant.int 0 %int0_3765 = torch.constant.int 0 %int9223372036854775807_3766 = torch.constant.int 9223372036854775807 %int1_3767 = torch.constant.int 1 %3260 = torch.aten.slice.Tensor %673, %int0_3764, %int0_3765, %int9223372036854775807_3766, %int1_3767 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_3768 = torch.constant.int 1 %int0_3769 = torch.constant.int 0 %int1_3770 = torch.constant.int 1 %3261 = torch.aten.slice.Tensor %3260, %int1_3768, %int0_3769, %3235, %int1_3770 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_3771 = torch.constant.int 1 %int2_3772 = torch.constant.int 2 
%3262 = torch.aten.transpose.int %3098, %int1_3771, %int2_3772 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,1,100],f32> %int4_3773 = torch.constant.int 4 %int32_3774 = torch.constant.int 32 %int1_3775 = torch.constant.int 1 %int100_3776 = torch.constant.int 100 %3263 = torch.prim.ListConstruct %int4_3773, %int32_3774, %int1_3775, %int100_3776 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_3777 = torch.constant.bool false %3264 = torch.aten.expand %3262, %3263, %false_3777 : !torch.vtensor<[4,32,1,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,100],f32> %int128_3778 = torch.constant.int 128 %int1_3779 = torch.constant.int 1 %int100_3780 = torch.constant.int 100 %3265 = torch.prim.ListConstruct %int128_3778, %int1_3779, %int100_3780 : (!torch.int, !torch.int, !torch.int) -> !torch.list %3266 = torch.aten.view %3264, %3265 : !torch.vtensor<[4,32,1,100],f32>, !torch.list -> !torch.vtensor<[128,1,100],f32> %int0_3781 = torch.constant.int 0 %int0_3782 = torch.constant.int 0 %int9223372036854775807_3783 = torch.constant.int 9223372036854775807 %int1_3784 = torch.constant.int 1 %3267 = torch.aten.slice.Tensor %3240, %int0_3781, %int0_3782, %int9223372036854775807_3783, %int1_3784 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_3785 = torch.constant.int 1 %int0_3786 = torch.constant.int 0 %int1_3787 = torch.constant.int 1 %3268 = torch.aten.slice.Tensor %3267, %int1_3785, %int0_3786, %3235, %int1_3787 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_3788 = torch.constant.int 1 %int2_3789 = torch.constant.int 2 %3269 = torch.aten.transpose.int %3268, %int1_3788, %int2_3789 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int2_3790 = torch.constant.int 2 %int3_3791 = torch.constant.int 3 %3270 
= torch.aten.transpose.int %3269, %int2_3790, %int3_3791 : !torch.vtensor<[4,32,?,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int1_3792 = torch.constant.int 1 %3271 = torch.aten.size.int %3259, %int1_3792 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_3793 = torch.constant.int 4 %int32_3794 = torch.constant.int 32 %int100_3795 = torch.constant.int 100 %3272 = torch.prim.ListConstruct %int4_3793, %int32_3794, %int100_3795, %3271 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_3796 = torch.constant.bool false %3273 = torch.aten.expand %3270, %3272, %false_3796 : !torch.vtensor<[4,32,100,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,100,?],f32> %int0_3797 = torch.constant.int 0 %3274 = torch.aten.clone %3273, %int0_3797 : !torch.vtensor<[4,32,100,?],f32>, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int128_3798 = torch.constant.int 128 %int100_3799 = torch.constant.int 100 %3275 = torch.prim.ListConstruct %int128_3798, %int100_3799, %3271 : (!torch.int, !torch.int, !torch.int) -> !torch.list %3276 = torch.aten._unsafe_view %3274, %3275 : !torch.vtensor<[4,32,100,?],f32>, !torch.list -> !torch.vtensor<[128,100,?],f32> %3277 = torch.aten.bmm %3266, %3276 : !torch.vtensor<[128,1,100],f32>, !torch.vtensor<[128,100,?],f32> -> !torch.vtensor<[128,1,?],f32> %int4_3800 = torch.constant.int 4 %int32_3801 = torch.constant.int 32 %int1_3802 = torch.constant.int 1 %3278 = torch.prim.ListConstruct %int4_3800, %int32_3801, %int1_3802, %3271 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3279 = torch.aten.view %3277, %3278 : !torch.vtensor<[128,1,?],f32>, !torch.list -> !torch.vtensor<[4,32,1,?],f32> %float1.000000e01_3803 = torch.constant.float 1.000000e+01 %3280 = torch.aten.div.Scalar %3279, %float1.000000e01_3803 : !torch.vtensor<[4,32,1,?],f32>, !torch.float -> !torch.vtensor<[4,32,1,?],f32> %int1_3804 = torch.constant.int 1 %3281 = torch.aten.add.Tensor %3280, %895, 
%int1_3804 : !torch.vtensor<[4,32,1,?],f32>, !torch.vtensor<[4,1,1,?],f32>, !torch.int -> !torch.vtensor<[4,32,1,?],f32> %int-1_3805 = torch.constant.int -1 %false_3806 = torch.constant.bool false %3282 = torch.aten._softmax %3281, %int-1_3805, %false_3806 : !torch.vtensor<[4,32,1,?],f32>, !torch.int, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int4_3807 = torch.constant.int 4 %int32_3808 = torch.constant.int 32 %int1_3809 = torch.constant.int 1 %3283 = torch.prim.ListConstruct %int4_3807, %int32_3808, %int1_3809, %3271 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_3810 = torch.constant.bool false %3284 = torch.aten.expand %3282, %3283, %false_3810 : !torch.vtensor<[4,32,1,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int128_3811 = torch.constant.int 128 %int1_3812 = torch.constant.int 1 %3285 = torch.prim.ListConstruct %int128_3811, %int1_3812, %3271 : (!torch.int, !torch.int, !torch.int) -> !torch.list %3286 = torch.aten.view %3284, %3285 : !torch.vtensor<[4,32,1,?],f32>, !torch.list -> !torch.vtensor<[128,1,?],f32> %int0_3813 = torch.constant.int 0 %int0_3814 = torch.constant.int 0 %int9223372036854775807_3815 = torch.constant.int 9223372036854775807 %int1_3816 = torch.constant.int 1 %3287 = torch.aten.slice.Tensor %3257, %int0_3813, %int0_3814, %int9223372036854775807_3815, %int1_3816 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_3817 = torch.constant.int 1 %int0_3818 = torch.constant.int 0 %int1_3819 = torch.constant.int 1 %3288 = torch.aten.slice.Tensor %3287, %int1_3817, %int0_3818, %3235, %int1_3819 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_3820 = torch.constant.int 1 %int2_3821 = torch.constant.int 2 %3289 = torch.aten.transpose.int %3288, %int1_3820, %int2_3821 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> 
!torch.vtensor<[4,32,?,100],f32> %int1_3822 = torch.constant.int 1 %3290 = torch.aten.size.int %3261, %int1_3822 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_3823 = torch.constant.int 4 %int32_3824 = torch.constant.int 32 %int100_3825 = torch.constant.int 100 %3291 = torch.prim.ListConstruct %int4_3823, %int32_3824, %3290, %int100_3825 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_3826 = torch.constant.bool false %3292 = torch.aten.expand %3289, %3291, %false_3826 : !torch.vtensor<[4,32,?,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,?,100],f32> %int0_3827 = torch.constant.int 0 %3293 = torch.aten.clone %3292, %int0_3827 : !torch.vtensor<[4,32,?,100],f32>, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int128_3828 = torch.constant.int 128 %int100_3829 = torch.constant.int 100 %3294 = torch.prim.ListConstruct %int128_3828, %3290, %int100_3829 : (!torch.int, !torch.int, !torch.int) -> !torch.list %3295 = torch.aten._unsafe_view %3293, %3294 : !torch.vtensor<[4,32,?,100],f32>, !torch.list -> !torch.vtensor<[128,?,100],f32> %3296 = torch.aten.bmm %3286, %3295 : !torch.vtensor<[128,1,?],f32>, !torch.vtensor<[128,?,100],f32> -> !torch.vtensor<[128,1,100],f32> %int4_3830 = torch.constant.int 4 %int32_3831 = torch.constant.int 32 %int1_3832 = torch.constant.int 1 %int100_3833 = torch.constant.int 100 %3297 = torch.prim.ListConstruct %int4_3830, %int32_3831, %int1_3832, %int100_3833 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3298 = torch.aten.view %3296, %3297 : !torch.vtensor<[128,1,100],f32>, !torch.list -> !torch.vtensor<[4,32,1,100],f32> %int1_3834 = torch.constant.int 1 %int2_3835 = torch.constant.int 2 %3299 = torch.aten.transpose.int %3298, %int1_3834, %int2_3835 : !torch.vtensor<[4,32,1,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,1,32,100],f32> %int4_3836 = torch.constant.int 4 %int1_3837 = torch.constant.int 1 %int-1_3838 = torch.constant.int -1 %3300 = 
torch.prim.ListConstruct %int4_3836, %int1_3837, %int-1_3838 : (!torch.int, !torch.int, !torch.int) -> !torch.list %3301 = torch.aten.view %3299, %3300 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,3200],f32> %3302 = torch_c.to_builtin_tensor %3301 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_3839 = tensor.cast %3302 : tensor<4x1x3200xf32> to tensor %3303 = torch_c.to_builtin_tensor %87 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %3304 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_3839, %3303) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_3840 = tensor.cast %3304 : tensor to tensor<4x1x3200xf32> %3305 = torch_c.from_builtin_tensor %cast_3840 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int1_3841 = torch.constant.int 1 %3306 = torch.aten.add.Tensor %3063, %3305, %int1_3841 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_3842 = torch.constant.int 2 %3307 = torch.aten.pow.Tensor_Scalar %3306, %int2_3842 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_3843 = torch.constant.int -1 %3308 = torch.prim.ListConstruct %int-1_3843 : (!torch.int) -> !torch.list %true_3844 = torch.constant.bool true %none_3845 = torch.constant.none %3309 = torch.aten.mean.dim %3307, %3308, %true_3844, %none_3845 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_3846 = torch.constant.float 9.9999999747524271E-7 %int1_3847 = torch.constant.int 1 %3310 = torch.aten.add.Scalar %3309, %float9.999990e-07_3846, %int1_3847 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %3311 = torch.aten.rsqrt %3310 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %3312 = torch.aten.mul.Tensor %3306, %3311 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %3313 
= torch.aten.mul.Tensor %3312, %88 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %3314 = torch_c.to_builtin_tensor %3313 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_3848 = tensor.cast %3314 : tensor<4x1x3200xf32> to tensor %3315 = torch_c.to_builtin_tensor %89 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %3316 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_3848, %3315) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_3849 = tensor.cast %3316 : tensor to tensor<4x1x8640xf32> %3317 = torch_c.from_builtin_tensor %cast_3849 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %3318 = torch.aten.silu %3317 : !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32> %3319 = torch_c.to_builtin_tensor %3313 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_3850 = tensor.cast %3319 : tensor<4x1x3200xf32> to tensor %3320 = torch_c.to_builtin_tensor %90 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %3321 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_3850, %3320) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_3851 = tensor.cast %3321 : tensor to tensor<4x1x8640xf32> %3322 = torch_c.from_builtin_tensor %cast_3851 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %3323 = torch.aten.mul.Tensor %3318, %3322 : !torch.vtensor<[4,1,8640],f32>, !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32> %3324 = torch_c.to_builtin_tensor %3323 : !torch.vtensor<[4,1,8640],f32> -> tensor<4x1x8640xf32> %cast_3852 = tensor.cast %3324 : tensor<4x1x8640xf32> to tensor %3325 = torch_c.to_builtin_tensor %91 : !torch.vtensor<[3200,8640],f16> -> tensor<3200x8640xf16> %3326 = util.call @sharktank_mmtfp_3d_3200_8640_f32f16f32(%cast_3852, %3325) : (tensor, tensor<3200x8640xf16>) -> tensor %cast_3853 = tensor.cast %3326 : tensor to tensor<4x1x3200xf32> %3327 = torch_c.from_builtin_tensor %cast_3853 : tensor<4x1x3200xf32> -> 
!torch.vtensor<[4,1,3200],f32> %int1_3854 = torch.constant.int 1 %3328 = torch.aten.add.Tensor %3306, %3327, %int1_3854 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_3855 = torch.constant.int 2 %3329 = torch.aten.pow.Tensor_Scalar %3328, %int2_3855 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_3856 = torch.constant.int -1 %3330 = torch.prim.ListConstruct %int-1_3856 : (!torch.int) -> !torch.list %true_3857 = torch.constant.bool true %none_3858 = torch.constant.none %3331 = torch.aten.mean.dim %3329, %3330, %true_3857, %none_3858 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_3859 = torch.constant.float 9.9999999747524271E-7 %int1_3860 = torch.constant.int 1 %3332 = torch.aten.add.Scalar %3331, %float9.999990e-07_3859, %int1_3860 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %3333 = torch.aten.rsqrt %3332 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %3334 = torch.aten.mul.Tensor %3328, %3333 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %3335 = torch.aten.mul.Tensor %3334, %92 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %3336 = torch_c.to_builtin_tensor %3335 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_3861 = tensor.cast %3336 : tensor<4x1x3200xf32> to tensor %3337 = torch_c.to_builtin_tensor %93 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %3338 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_3861, %3337) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_3862 = tensor.cast %3338 : tensor to tensor<4x1x3200xf32> %3339 = torch_c.from_builtin_tensor %cast_3862 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %3340 = torch_c.to_builtin_tensor %3335 : !torch.vtensor<[4,1,3200],f32> 
-> tensor<4x1x3200xf32> %cast_3863 = tensor.cast %3340 : tensor<4x1x3200xf32> to tensor %3341 = torch_c.to_builtin_tensor %94 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %3342 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_3863, %3341) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_3864 = tensor.cast %3342 : tensor to tensor<4x1x3200xf32> %3343 = torch_c.from_builtin_tensor %cast_3864 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %3344 = torch_c.to_builtin_tensor %3335 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_3865 = tensor.cast %3344 : tensor<4x1x3200xf32> to tensor %3345 = torch_c.to_builtin_tensor %95 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %3346 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_3865, %3345) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_3866 = tensor.cast %3346 : tensor to tensor<4x1x3200xf32> %3347 = torch_c.from_builtin_tensor %cast_3866 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int4_3867 = torch.constant.int 4 %int1_3868 = torch.constant.int 1 %int32_3869 = torch.constant.int 32 %int100_3870 = torch.constant.int 100 %3348 = torch.prim.ListConstruct %int4_3867, %int1_3868, %int32_3869, %int100_3870 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3349 = torch.aten.view %3339, %3348 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_3871 = torch.constant.int 4 %int1_3872 = torch.constant.int 1 %int32_3873 = torch.constant.int 32 %int100_3874 = torch.constant.int 100 %3350 = torch.prim.ListConstruct %int4_3871, %int1_3872, %int32_3873, %int100_3874 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3351 = torch.aten.view %3343, %3350 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_3875 = torch.constant.int 4 %int1_3876 = torch.constant.int 1 %int32_3877 = torch.constant.int 32 %int100_3878 = torch.constant.int 100 %3352 = 
torch.prim.ListConstruct %int4_3875, %int1_3876, %int32_3877, %int100_3878 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3353 = torch.aten.view %3347, %3352 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_3879 = torch.constant.int 4 %int1_3880 = torch.constant.int 1 %int32_3881 = torch.constant.int 32 %int-1_3882 = torch.constant.int -1 %int2_3883 = torch.constant.int 2 %3354 = torch.prim.ListConstruct %int4_3879, %int1_3880, %int32_3881, %int-1_3882, %int2_3883 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3355 = torch.aten.view %3349, %3354 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %3356 = torch.aten.view_as_complex %3355 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %int4_3884 = torch.constant.int 4 %int1_3885 = torch.constant.int 1 %int32_3886 = torch.constant.int 32 %int-1_3887 = torch.constant.int -1 %int2_3888 = torch.constant.int 2 %3357 = torch.prim.ListConstruct %int4_3884, %int1_3885, %int32_3886, %int-1_3887, %int2_3888 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3358 = torch.aten.view %3351, %3357 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %3359 = torch.aten.view_as_complex %3358 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %3360 = torch.aten.mul.Tensor %3356, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %3361 = torch.aten.view_as_real %3360 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_3889 = torch.constant.int 4 %int1_3890 = torch.constant.int 1 %int32_3891 = torch.constant.int 32 %int100_3892 = torch.constant.int 100 %3362 = torch.prim.ListConstruct %int4_3889, %int1_3890, %int32_3891, %int100_3892 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3363 = 
torch.aten.view %3361, %3362 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %3364 = torch.aten.mul.Tensor %3359, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %3365 = torch.aten.view_as_real %3364 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_3893 = torch.constant.int 4 %int1_3894 = torch.constant.int 1 %int32_3895 = torch.constant.int 32 %int100_3896 = torch.constant.int 100 %3366 = torch.prim.ListConstruct %int4_3893, %int1_3894, %int32_3895, %int100_3896 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3367 = torch.aten.view %3365, %3366 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int1_3897 = torch.constant.int 1 %int1_3898 = torch.constant.int 1 %3368 = torch.aten.add.Scalar %arg2, %int1_3897, %int1_3898 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[4],si64> %int0_3899 = torch.constant.int 0 %int0_3900 = torch.constant.int 0 %3369 = torch.aten.select.int %3368, %int0_3899, %int0_3900 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_3901 = torch.constant.int 0 %int0_3902 = torch.constant.int 0 %3370 = torch.aten.select.int %arg3, %int0_3901, %int0_3902 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_3903 = torch.constant.int 0 %int0_3904 = torch.constant.int 0 %int9223372036854775807_3905 = torch.constant.int 9223372036854775807 %int1_3906 = torch.constant.int 1 %3371 = torch.aten.slice.Tensor %3370, %int0_3903, %int0_3904, %int9223372036854775807_3905, %int1_3906 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_3907 = torch.constant.int 16 %3372 = torch.aten.floor_divide.Scalar %3369, %int16_3907 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_3908 = torch.constant.int 0 %3373 = 
torch.aten.index_select %3371, %int0_3908, %3372 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_3909 = torch.constant.int 16 %3374 = torch.aten.remainder.Scalar %3369, %int16_3909 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_3910 = torch.constant.none %3375 = torch.aten.clone %398, %none_3910 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_3911 = torch.constant.none %3376 = torch.aten.clone %399, %none_3911 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_3912 = torch.constant.int 0 %3377 = torch.aten.unsqueeze %3374, %int0_3912 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_3913 = torch.constant.int 0 %int0_3914 = torch.constant.int 0 %3378 = torch.aten.select.int %3367, %int0_3913, %int0_3914 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_3915 = torch.constant.int 0 %int0_3916 = torch.constant.int 0 %3379 = torch.aten.select.int %3378, %int0_3915, %int0_3916 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %int-1_3917 = torch.constant.int -1 %int26_3918 = torch.constant.int 26 %int2_3919 = torch.constant.int 2 %int16_3920 = torch.constant.int 16 %int32_3921 = torch.constant.int 32 %int100_3922 = torch.constant.int 100 %3380 = torch.prim.ListConstruct %int-1_3917, %int26_3918, %int2_3919, %int16_3920, %int32_3921, %int100_3922 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3381 = torch.aten.view %3215, %3380 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %3382 = torch.prim.ListConstruct %3373, %3375, %3376, %3377 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_3923 = torch.constant.bool false %3383 = torch.aten.index_put %3381, %3382, %3379, %false_3923 : 
!torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_3924 = torch.constant.int 2662400 %3384 = torch.prim.ListConstruct %731, %int2662400_3924 : (!torch.int, !torch.int) -> !torch.list %3385 = torch.aten.view %3383, %3384 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_3925 = torch.constant.int -1 %int26_3926 = torch.constant.int 26 %int2_3927 = torch.constant.int 2 %int16_3928 = torch.constant.int 16 %int32_3929 = torch.constant.int 32 %int100_3930 = torch.constant.int 100 %3386 = torch.prim.ListConstruct %int-1_3925, %int26_3926, %int2_3927, %int16_3928, %int32_3929, %int100_3930 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3387 = torch.aten.view %3385, %3386 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_3931 = torch.constant.none %3388 = torch.aten.clone %400, %none_3931 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_3932 = torch.constant.none %3389 = torch.aten.clone %401, %none_3932 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_3933 = torch.constant.int 0 %3390 = torch.aten.unsqueeze %3374, %int0_3933 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_3934 = torch.constant.int 0 %int0_3935 = torch.constant.int 0 %3391 = torch.aten.select.int %3353, %int0_3934, %int0_3935 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_3936 = torch.constant.int 0 %int0_3937 = torch.constant.int 0 %3392 = torch.aten.select.int %3391, %int0_3936, %int0_3937 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %3393 = torch.prim.ListConstruct %3373, %3388, %3389, %3390 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> 
!torch.list> %false_3938 = torch.constant.bool false %3394 = torch.aten.index_put %3387, %3393, %3392, %false_3938 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_3939 = torch.constant.int 2662400 %3395 = torch.prim.ListConstruct %731, %int2662400_3939 : (!torch.int, !torch.int) -> !torch.list %3396 = torch.aten.view %3394, %3395 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_3940 = torch.constant.int -1 %int26_3941 = torch.constant.int 26 %int2_3942 = torch.constant.int 2 %int16_3943 = torch.constant.int 16 %int32_3944 = torch.constant.int 32 %int100_3945 = torch.constant.int 100 %3397 = torch.prim.ListConstruct %int-1_3940, %int26_3941, %int2_3942, %int16_3943, %int32_3944, %int100_3945 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3398 = torch.aten.view %3396, %3397 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_3946 = torch.constant.int 0 %int1_3947 = torch.constant.int 1 %3399 = torch.aten.select.int %3368, %int0_3946, %int1_3947 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_3948 = torch.constant.int 0 %int1_3949 = torch.constant.int 1 %3400 = torch.aten.select.int %arg3, %int0_3948, %int1_3949 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_3950 = torch.constant.int 0 %int0_3951 = torch.constant.int 0 %int9223372036854775807_3952 = torch.constant.int 9223372036854775807 %int1_3953 = torch.constant.int 1 %3401 = torch.aten.slice.Tensor %3400, %int0_3950, %int0_3951, %int9223372036854775807_3952, %int1_3953 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_3954 = torch.constant.int 16 %3402 = torch.aten.floor_divide.Scalar %3399, %int16_3954 : !torch.vtensor<[],si64>, !torch.int -> 
!torch.vtensor<[],si64> %int0_3955 = torch.constant.int 0 %3403 = torch.aten.index_select %3401, %int0_3955, %3402 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_3956 = torch.constant.int 16 %3404 = torch.aten.remainder.Scalar %3399, %int16_3956 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_3957 = torch.constant.none %3405 = torch.aten.clone %402, %none_3957 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_3958 = torch.constant.none %3406 = torch.aten.clone %403, %none_3958 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_3959 = torch.constant.int 0 %3407 = torch.aten.unsqueeze %3404, %int0_3959 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_3960 = torch.constant.int 0 %int1_3961 = torch.constant.int 1 %3408 = torch.aten.select.int %3367, %int0_3960, %int1_3961 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_3962 = torch.constant.int 0 %int0_3963 = torch.constant.int 0 %3409 = torch.aten.select.int %3408, %int0_3962, %int0_3963 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %3410 = torch.prim.ListConstruct %3403, %3405, %3406, %3407 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_3964 = torch.constant.bool false %3411 = torch.aten.index_put %3398, %3410, %3409, %false_3964 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_3965 = torch.constant.int 2662400 %3412 = torch.prim.ListConstruct %731, %int2662400_3965 : (!torch.int, !torch.int) -> !torch.list %3413 = torch.aten.view %3411, %3412 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_3966 = torch.constant.int -1 %int26_3967 = torch.constant.int 
26 %int2_3968 = torch.constant.int 2 %int16_3969 = torch.constant.int 16 %int32_3970 = torch.constant.int 32 %int100_3971 = torch.constant.int 100 %3414 = torch.prim.ListConstruct %int-1_3966, %int26_3967, %int2_3968, %int16_3969, %int32_3970, %int100_3971 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3415 = torch.aten.view %3413, %3414 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_3972 = torch.constant.none %3416 = torch.aten.clone %404, %none_3972 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_3973 = torch.constant.none %3417 = torch.aten.clone %405, %none_3973 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_3974 = torch.constant.int 0 %3418 = torch.aten.unsqueeze %3404, %int0_3974 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_3975 = torch.constant.int 0 %int1_3976 = torch.constant.int 1 %3419 = torch.aten.select.int %3353, %int0_3975, %int1_3976 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_3977 = torch.constant.int 0 %int0_3978 = torch.constant.int 0 %3420 = torch.aten.select.int %3419, %int0_3977, %int0_3978 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %3421 = torch.prim.ListConstruct %3403, %3416, %3417, %3418 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_3979 = torch.constant.bool false %3422 = torch.aten.index_put %3415, %3421, %3420, %false_3979 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_3980 = torch.constant.int 2662400 %3423 = torch.prim.ListConstruct %731, %int2662400_3980 : (!torch.int, !torch.int) -> !torch.list %3424 = torch.aten.view %3422, %3423 : !torch.vtensor<[?,26,2,16,32,100],f32>, 
!torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_3981 = torch.constant.int -1 %int26_3982 = torch.constant.int 26 %int2_3983 = torch.constant.int 2 %int16_3984 = torch.constant.int 16 %int32_3985 = torch.constant.int 32 %int100_3986 = torch.constant.int 100 %3425 = torch.prim.ListConstruct %int-1_3981, %int26_3982, %int2_3983, %int16_3984, %int32_3985, %int100_3986 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3426 = torch.aten.view %3424, %3425 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_3987 = torch.constant.int 0 %int2_3988 = torch.constant.int 2 %3427 = torch.aten.select.int %3368, %int0_3987, %int2_3988 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_3989 = torch.constant.int 0 %int2_3990 = torch.constant.int 2 %3428 = torch.aten.select.int %arg3, %int0_3989, %int2_3990 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_3991 = torch.constant.int 0 %int0_3992 = torch.constant.int 0 %int9223372036854775807_3993 = torch.constant.int 9223372036854775807 %int1_3994 = torch.constant.int 1 %3429 = torch.aten.slice.Tensor %3428, %int0_3991, %int0_3992, %int9223372036854775807_3993, %int1_3994 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_3995 = torch.constant.int 16 %3430 = torch.aten.floor_divide.Scalar %3427, %int16_3995 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_3996 = torch.constant.int 0 %3431 = torch.aten.index_select %3429, %int0_3996, %3430 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_3997 = torch.constant.int 16 %3432 = torch.aten.remainder.Scalar %3427, %int16_3997 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_3998 = torch.constant.none %3433 = torch.aten.clone %406, %none_3998 : !torch.vtensor<[1],si64>, !torch.none -> 
!torch.vtensor<[1],si64> %none_3999 = torch.constant.none %3434 = torch.aten.clone %407, %none_3999 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_4000 = torch.constant.int 0 %3435 = torch.aten.unsqueeze %3432, %int0_4000 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_4001 = torch.constant.int 0 %int2_4002 = torch.constant.int 2 %3436 = torch.aten.select.int %3367, %int0_4001, %int2_4002 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_4003 = torch.constant.int 0 %int0_4004 = torch.constant.int 0 %3437 = torch.aten.select.int %3436, %int0_4003, %int0_4004 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %3438 = torch.prim.ListConstruct %3431, %3433, %3434, %3435 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_4005 = torch.constant.bool false %3439 = torch.aten.index_put %3426, %3438, %3437, %false_4005 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_4006 = torch.constant.int 2662400 %3440 = torch.prim.ListConstruct %731, %int2662400_4006 : (!torch.int, !torch.int) -> !torch.list %3441 = torch.aten.view %3439, %3440 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_4007 = torch.constant.int -1 %int26_4008 = torch.constant.int 26 %int2_4009 = torch.constant.int 2 %int16_4010 = torch.constant.int 16 %int32_4011 = torch.constant.int 32 %int100_4012 = torch.constant.int 100 %3442 = torch.prim.ListConstruct %int-1_4007, %int26_4008, %int2_4009, %int16_4010, %int32_4011, %int100_4012 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3443 = torch.aten.view %3441, %3442 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> 
%none_4013 = torch.constant.none %3444 = torch.aten.clone %408, %none_4013 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_4014 = torch.constant.none %3445 = torch.aten.clone %409, %none_4014 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_4015 = torch.constant.int 0 %3446 = torch.aten.unsqueeze %3432, %int0_4015 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_4016 = torch.constant.int 0 %int2_4017 = torch.constant.int 2 %3447 = torch.aten.select.int %3353, %int0_4016, %int2_4017 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_4018 = torch.constant.int 0 %int0_4019 = torch.constant.int 0 %3448 = torch.aten.select.int %3447, %int0_4018, %int0_4019 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %3449 = torch.prim.ListConstruct %3431, %3444, %3445, %3446 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_4020 = torch.constant.bool false %3450 = torch.aten.index_put %3443, %3449, %3448, %false_4020 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_4021 = torch.constant.int 2662400 %3451 = torch.prim.ListConstruct %731, %int2662400_4021 : (!torch.int, !torch.int) -> !torch.list %3452 = torch.aten.view %3450, %3451 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_4022 = torch.constant.int -1 %int26_4023 = torch.constant.int 26 %int2_4024 = torch.constant.int 2 %int16_4025 = torch.constant.int 16 %int32_4026 = torch.constant.int 32 %int100_4027 = torch.constant.int 100 %3453 = torch.prim.ListConstruct %int-1_4022, %int26_4023, %int2_4024, %int16_4025, %int32_4026, %int100_4027 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3454 = 
torch.aten.view %3452, %3453 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_4028 = torch.constant.int 0 %int3_4029 = torch.constant.int 3 %3455 = torch.aten.select.int %3368, %int0_4028, %int3_4029 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_4030 = torch.constant.int 0 %int3_4031 = torch.constant.int 3 %3456 = torch.aten.select.int %arg3, %int0_4030, %int3_4031 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_4032 = torch.constant.int 0 %int0_4033 = torch.constant.int 0 %int9223372036854775807_4034 = torch.constant.int 9223372036854775807 %int1_4035 = torch.constant.int 1 %3457 = torch.aten.slice.Tensor %3456, %int0_4032, %int0_4033, %int9223372036854775807_4034, %int1_4035 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_4036 = torch.constant.int 16 %3458 = torch.aten.floor_divide.Scalar %3455, %int16_4036 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_4037 = torch.constant.int 0 %3459 = torch.aten.index_select %3457, %int0_4037, %3458 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_4038 = torch.constant.int 16 %3460 = torch.aten.remainder.Scalar %3455, %int16_4038 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_4039 = torch.constant.none %3461 = torch.aten.clone %410, %none_4039 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_4040 = torch.constant.none %3462 = torch.aten.clone %411, %none_4040 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_4041 = torch.constant.int 0 %3463 = torch.aten.unsqueeze %3460, %int0_4041 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_4042 = torch.constant.int 0 %int3_4043 = torch.constant.int 3 %3464 = torch.aten.select.int %3367, %int0_4042, %int3_4043 : 
!torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_4044 = torch.constant.int 0 %int0_4045 = torch.constant.int 0 %3465 = torch.aten.select.int %3464, %int0_4044, %int0_4045 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %3466 = torch.prim.ListConstruct %3459, %3461, %3462, %3463 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_4046 = torch.constant.bool false %3467 = torch.aten.index_put %3454, %3466, %3465, %false_4046 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_4047 = torch.constant.int 2662400 %3468 = torch.prim.ListConstruct %731, %int2662400_4047 : (!torch.int, !torch.int) -> !torch.list %3469 = torch.aten.view %3467, %3468 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_4048 = torch.constant.int -1 %int26_4049 = torch.constant.int 26 %int2_4050 = torch.constant.int 2 %int16_4051 = torch.constant.int 16 %int32_4052 = torch.constant.int 32 %int100_4053 = torch.constant.int 100 %3470 = torch.prim.ListConstruct %int-1_4048, %int26_4049, %int2_4050, %int16_4051, %int32_4052, %int100_4053 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3471 = torch.aten.view %3469, %3470 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_4054 = torch.constant.none %3472 = torch.aten.clone %412, %none_4054 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_4055 = torch.constant.none %3473 = torch.aten.clone %413, %none_4055 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_4056 = torch.constant.int 0 %3474 = torch.aten.unsqueeze %3460, %int0_4056 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_4057 = 
torch.constant.int 0 %int3_4058 = torch.constant.int 3 %3475 = torch.aten.select.int %3353, %int0_4057, %int3_4058 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_4059 = torch.constant.int 0 %int0_4060 = torch.constant.int 0 %3476 = torch.aten.select.int %3475, %int0_4059, %int0_4060 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %3477 = torch.prim.ListConstruct %3459, %3472, %3473, %3474 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_4061 = torch.constant.bool false %3478 = torch.aten.index_put %3471, %3477, %3476, %false_4061 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_4062 = torch.constant.int 2662400 %3479 = torch.prim.ListConstruct %731, %int2662400_4062 : (!torch.int, !torch.int) -> !torch.list %3480 = torch.aten.view %3478, %3479 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int52_4063 = torch.constant.int 52 %3481 = torch.aten.mul.Scalar %arg3, %int52_4063 : !torch.vtensor<[4,?],si64>, !torch.int -> !torch.vtensor<[4,?],si64> %int20 = torch.constant.int 20 %int1_4064 = torch.constant.int 1 %3482 = torch.aten.add.Scalar %3481, %int20, %int1_4064 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_4065 = torch.constant.int 4 %3483 = torch.aten.mul.int %int4_4065, %655 : !torch.int, !torch.int -> !torch.int %3484 = torch.prim.ListConstruct %3483 : (!torch.int) -> !torch.list %3485 = torch.aten.view %3482, %3484 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int-1_4066 = torch.constant.int -1 %int26_4067 = torch.constant.int 26 %int2_4068 = torch.constant.int 2 %int16_4069 = torch.constant.int 16 %int32_4070 = torch.constant.int 32 %int100_4071 = torch.constant.int 100 %3486 = 
torch.prim.ListConstruct %int-1_4066, %int26_4067, %int2_4068, %int16_4069, %int32_4070, %int100_4071 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3487 = torch.aten.view %3480, %3486 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int26_4072 = torch.constant.int 26 %3488 = torch.aten.mul.int %731, %int26_4072 : !torch.int, !torch.int -> !torch.int %int2_4073 = torch.constant.int 2 %3489 = torch.aten.mul.int %3488, %int2_4073 : !torch.int, !torch.int -> !torch.int %int16_4074 = torch.constant.int 16 %int32_4075 = torch.constant.int 32 %int100_4076 = torch.constant.int 100 %3490 = torch.prim.ListConstruct %3489, %int16_4074, %int32_4075, %int100_4076 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3491 = torch.aten.view %3487, %3490 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,16,32,100],f32> %int0_4077 = torch.constant.int 0 %3492 = torch.aten.index_select %3491, %int0_4077, %3485 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_4078 = torch.constant.int 4 %int16_4079 = torch.constant.int 16 %int32_4080 = torch.constant.int 32 %int100_4081 = torch.constant.int 100 %3493 = torch.prim.ListConstruct %int4_4078, %655, %int16_4079, %int32_4080, %int100_4081 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3494 = torch.aten.view %3492, %3493 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_4082 = torch.constant.int 1 %3495 = torch.aten.size.int %3494, %int1_4082 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_4083 = torch.constant.int 16 %3496 = torch.aten.mul.int %3495, %int16_4083 : !torch.int, !torch.int -> !torch.int %int4_4084 = torch.constant.int 4 %int32_4085 = torch.constant.int 32 %int100_4086 = torch.constant.int 100 %3497 = torch.prim.ListConstruct %int4_4084, 
%3496, %int32_4085, %int100_4086 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3498 = torch.aten.view %3494, %3497 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_4087 = torch.constant.int 0 %int0_4088 = torch.constant.int 0 %int9223372036854775807_4089 = torch.constant.int 9223372036854775807 %int1_4090 = torch.constant.int 1 %3499 = torch.aten.slice.Tensor %3240, %int0_4087, %int0_4088, %int9223372036854775807_4089, %int1_4090 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int16_4091 = torch.constant.int 16 %3500 = torch.aten.mul.int %655, %int16_4091 : !torch.int, !torch.int -> !torch.int %int1_4092 = torch.constant.int 1 %int0_4093 = torch.constant.int 0 %int1_4094 = torch.constant.int 1 %3501 = torch.aten.slice.Tensor %3499, %int1_4092, %int0_4093, %3500, %int1_4094 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_4095 = torch.constant.bool false %3502 = torch.aten.copy %3501, %3498, %false_4095 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_4096 = torch.constant.int 0 %int0_4097 = torch.constant.int 0 %int9223372036854775807_4098 = torch.constant.int 9223372036854775807 %int1_4099 = torch.constant.int 1 %3503 = torch.aten.slice.Tensor %3240, %int0_4096, %int0_4097, %int9223372036854775807_4098, %int1_4099 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_4100 = torch.constant.int 1 %int0_4101 = torch.constant.int 0 %int1_4102 = torch.constant.int 1 %3504 = torch.aten.slice_scatter %3503, %3502, %int1_4100, %int0_4101, %3500, %int1_4102 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> 
!torch.vtensor<[4,2048,32,100],f32> %int0_4103 = torch.constant.int 0 %int0_4104 = torch.constant.int 0 %int9223372036854775807_4105 = torch.constant.int 9223372036854775807 %int1_4106 = torch.constant.int 1 %3505 = torch.aten.slice_scatter %3240, %3504, %int0_4103, %int0_4104, %int9223372036854775807_4105, %int1_4106 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_4107 = torch.constant.int 1 %int1_4108 = torch.constant.int 1 %3506 = torch.aten.add.Scalar %3482, %int1_4107, %int1_4108 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_4109 = torch.constant.int 4 %3507 = torch.aten.mul.int %int4_4109, %655 : !torch.int, !torch.int -> !torch.int %3508 = torch.prim.ListConstruct %3507 : (!torch.int) -> !torch.list %3509 = torch.aten.view %3506, %3508 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int0_4110 = torch.constant.int 0 %3510 = torch.aten.index_select %3491, %int0_4110, %3509 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_4111 = torch.constant.int 4 %int16_4112 = torch.constant.int 16 %int32_4113 = torch.constant.int 32 %int100_4114 = torch.constant.int 100 %3511 = torch.prim.ListConstruct %int4_4111, %655, %int16_4112, %int32_4113, %int100_4114 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3512 = torch.aten.view %3510, %3511 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_4115 = torch.constant.int 1 %3513 = torch.aten.size.int %3512, %int1_4115 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_4116 = torch.constant.int 16 %3514 = torch.aten.mul.int %3513, %int16_4116 : !torch.int, !torch.int -> !torch.int %int4_4117 = torch.constant.int 4 %int32_4118 = torch.constant.int 32 %int100_4119 = torch.constant.int 100 
%3515 = torch.prim.ListConstruct %int4_4117, %3514, %int32_4118, %int100_4119 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3516 = torch.aten.view %3512, %3515 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_4120 = torch.constant.int 0 %int0_4121 = torch.constant.int 0 %int9223372036854775807_4122 = torch.constant.int 9223372036854775807 %int1_4123 = torch.constant.int 1 %3517 = torch.aten.slice.Tensor %3257, %int0_4120, %int0_4121, %int9223372036854775807_4122, %int1_4123 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_4124 = torch.constant.int 1 %int0_4125 = torch.constant.int 0 %int1_4126 = torch.constant.int 1 %3518 = torch.aten.slice.Tensor %3517, %int1_4124, %int0_4125, %3500, %int1_4126 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_4127 = torch.constant.bool false %3519 = torch.aten.copy %3518, %3516, %false_4127 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_4128 = torch.constant.int 0 %int0_4129 = torch.constant.int 0 %int9223372036854775807_4130 = torch.constant.int 9223372036854775807 %int1_4131 = torch.constant.int 1 %3520 = torch.aten.slice.Tensor %3257, %int0_4128, %int0_4129, %int9223372036854775807_4130, %int1_4131 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_4132 = torch.constant.int 1 %int0_4133 = torch.constant.int 0 %int1_4134 = torch.constant.int 1 %3521 = torch.aten.slice_scatter %3520, %3519, %int1_4132, %int0_4133, %3500, %int1_4134 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_4135 = torch.constant.int 0 %int0_4136 = torch.constant.int 
0 %int9223372036854775807_4137 = torch.constant.int 9223372036854775807 %int1_4138 = torch.constant.int 1 %3522 = torch.aten.slice_scatter %3257, %3521, %int0_4135, %int0_4136, %int9223372036854775807_4137, %int1_4138 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_4139 = torch.constant.int 0 %int0_4140 = torch.constant.int 0 %int9223372036854775807_4141 = torch.constant.int 9223372036854775807 %int1_4142 = torch.constant.int 1 %3523 = torch.aten.slice.Tensor %671, %int0_4139, %int0_4140, %int9223372036854775807_4141, %int1_4142 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_4143 = torch.constant.int 1 %int0_4144 = torch.constant.int 0 %int1_4145 = torch.constant.int 1 %3524 = torch.aten.slice.Tensor %3523, %int1_4143, %int0_4144, %3500, %int1_4145 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int0_4146 = torch.constant.int 0 %int0_4147 = torch.constant.int 0 %int9223372036854775807_4148 = torch.constant.int 9223372036854775807 %int1_4149 = torch.constant.int 1 %3525 = torch.aten.slice.Tensor %673, %int0_4146, %int0_4147, %int9223372036854775807_4148, %int1_4149 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_4150 = torch.constant.int 1 %int0_4151 = torch.constant.int 0 %int1_4152 = torch.constant.int 1 %3526 = torch.aten.slice.Tensor %3525, %int1_4150, %int0_4151, %3500, %int1_4152 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_4153 = torch.constant.int 1 %int2_4154 = torch.constant.int 2 %3527 = torch.aten.transpose.int %3363, %int1_4153, %int2_4154 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> 
!torch.vtensor<[4,32,1,100],f32> %int4_4155 = torch.constant.int 4 %int32_4156 = torch.constant.int 32 %int1_4157 = torch.constant.int 1 %int100_4158 = torch.constant.int 100 %3528 = torch.prim.ListConstruct %int4_4155, %int32_4156, %int1_4157, %int100_4158 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_4159 = torch.constant.bool false %3529 = torch.aten.expand %3527, %3528, %false_4159 : !torch.vtensor<[4,32,1,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,100],f32> %int128_4160 = torch.constant.int 128 %int1_4161 = torch.constant.int 1 %int100_4162 = torch.constant.int 100 %3530 = torch.prim.ListConstruct %int128_4160, %int1_4161, %int100_4162 : (!torch.int, !torch.int, !torch.int) -> !torch.list %3531 = torch.aten.view %3529, %3530 : !torch.vtensor<[4,32,1,100],f32>, !torch.list -> !torch.vtensor<[128,1,100],f32> %int0_4163 = torch.constant.int 0 %int0_4164 = torch.constant.int 0 %int9223372036854775807_4165 = torch.constant.int 9223372036854775807 %int1_4166 = torch.constant.int 1 %3532 = torch.aten.slice.Tensor %3505, %int0_4163, %int0_4164, %int9223372036854775807_4165, %int1_4166 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_4167 = torch.constant.int 1 %int0_4168 = torch.constant.int 0 %int1_4169 = torch.constant.int 1 %3533 = torch.aten.slice.Tensor %3532, %int1_4167, %int0_4168, %3500, %int1_4169 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_4170 = torch.constant.int 1 %int2_4171 = torch.constant.int 2 %3534 = torch.aten.transpose.int %3533, %int1_4170, %int2_4171 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int2_4172 = torch.constant.int 2 %int3_4173 = torch.constant.int 3 %3535 = torch.aten.transpose.int %3534, %int2_4172, %int3_4173 : !torch.vtensor<[4,32,?,100],f32>, !torch.int, !torch.int -> 
!torch.vtensor<[4,32,100,?],f32> %int1_4174 = torch.constant.int 1 %3536 = torch.aten.size.int %3524, %int1_4174 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_4175 = torch.constant.int 4 %int32_4176 = torch.constant.int 32 %int100_4177 = torch.constant.int 100 %3537 = torch.prim.ListConstruct %int4_4175, %int32_4176, %int100_4177, %3536 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_4178 = torch.constant.bool false %3538 = torch.aten.expand %3535, %3537, %false_4178 : !torch.vtensor<[4,32,100,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,100,?],f32> %int0_4179 = torch.constant.int 0 %3539 = torch.aten.clone %3538, %int0_4179 : !torch.vtensor<[4,32,100,?],f32>, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int128_4180 = torch.constant.int 128 %int100_4181 = torch.constant.int 100 %3540 = torch.prim.ListConstruct %int128_4180, %int100_4181, %3536 : (!torch.int, !torch.int, !torch.int) -> !torch.list %3541 = torch.aten._unsafe_view %3539, %3540 : !torch.vtensor<[4,32,100,?],f32>, !torch.list -> !torch.vtensor<[128,100,?],f32> %3542 = torch.aten.bmm %3531, %3541 : !torch.vtensor<[128,1,100],f32>, !torch.vtensor<[128,100,?],f32> -> !torch.vtensor<[128,1,?],f32> %int4_4182 = torch.constant.int 4 %int32_4183 = torch.constant.int 32 %int1_4184 = torch.constant.int 1 %3543 = torch.prim.ListConstruct %int4_4182, %int32_4183, %int1_4184, %3536 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3544 = torch.aten.view %3542, %3543 : !torch.vtensor<[128,1,?],f32>, !torch.list -> !torch.vtensor<[4,32,1,?],f32> %float1.000000e01_4185 = torch.constant.float 1.000000e+01 %3545 = torch.aten.div.Scalar %3544, %float1.000000e01_4185 : !torch.vtensor<[4,32,1,?],f32>, !torch.float -> !torch.vtensor<[4,32,1,?],f32> %int1_4186 = torch.constant.int 1 %3546 = torch.aten.add.Tensor %3545, %895, %int1_4186 : !torch.vtensor<[4,32,1,?],f32>, !torch.vtensor<[4,1,1,?],f32>, !torch.int -> !torch.vtensor<[4,32,1,?],f32> 
%int-1_4187 = torch.constant.int -1 %false_4188 = torch.constant.bool false %3547 = torch.aten._softmax %3546, %int-1_4187, %false_4188 : !torch.vtensor<[4,32,1,?],f32>, !torch.int, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int4_4189 = torch.constant.int 4 %int32_4190 = torch.constant.int 32 %int1_4191 = torch.constant.int 1 %3548 = torch.prim.ListConstruct %int4_4189, %int32_4190, %int1_4191, %3536 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_4192 = torch.constant.bool false %3549 = torch.aten.expand %3547, %3548, %false_4192 : !torch.vtensor<[4,32,1,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int128_4193 = torch.constant.int 128 %int1_4194 = torch.constant.int 1 %3550 = torch.prim.ListConstruct %int128_4193, %int1_4194, %3536 : (!torch.int, !torch.int, !torch.int) -> !torch.list %3551 = torch.aten.view %3549, %3550 : !torch.vtensor<[4,32,1,?],f32>, !torch.list -> !torch.vtensor<[128,1,?],f32> %int0_4195 = torch.constant.int 0 %int0_4196 = torch.constant.int 0 %int9223372036854775807_4197 = torch.constant.int 9223372036854775807 %int1_4198 = torch.constant.int 1 %3552 = torch.aten.slice.Tensor %3522, %int0_4195, %int0_4196, %int9223372036854775807_4197, %int1_4198 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_4199 = torch.constant.int 1 %int0_4200 = torch.constant.int 0 %int1_4201 = torch.constant.int 1 %3553 = torch.aten.slice.Tensor %3552, %int1_4199, %int0_4200, %3500, %int1_4201 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_4202 = torch.constant.int 1 %int2_4203 = torch.constant.int 2 %3554 = torch.aten.transpose.int %3553, %int1_4202, %int2_4203 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int1_4204 = torch.constant.int 1 %3555 = torch.aten.size.int %3526, %int1_4204 : 
!torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_4205 = torch.constant.int 4 %int32_4206 = torch.constant.int 32 %int100_4207 = torch.constant.int 100 %3556 = torch.prim.ListConstruct %int4_4205, %int32_4206, %3555, %int100_4207 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_4208 = torch.constant.bool false %3557 = torch.aten.expand %3554, %3556, %false_4208 : !torch.vtensor<[4,32,?,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,?,100],f32> %int0_4209 = torch.constant.int 0 %3558 = torch.aten.clone %3557, %int0_4209 : !torch.vtensor<[4,32,?,100],f32>, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int128_4210 = torch.constant.int 128 %int100_4211 = torch.constant.int 100 %3559 = torch.prim.ListConstruct %int128_4210, %3555, %int100_4211 : (!torch.int, !torch.int, !torch.int) -> !torch.list %3560 = torch.aten._unsafe_view %3558, %3559 : !torch.vtensor<[4,32,?,100],f32>, !torch.list -> !torch.vtensor<[128,?,100],f32> %3561 = torch.aten.bmm %3551, %3560 : !torch.vtensor<[128,1,?],f32>, !torch.vtensor<[128,?,100],f32> -> !torch.vtensor<[128,1,100],f32> %int4_4212 = torch.constant.int 4 %int32_4213 = torch.constant.int 32 %int1_4214 = torch.constant.int 1 %int100_4215 = torch.constant.int 100 %3562 = torch.prim.ListConstruct %int4_4212, %int32_4213, %int1_4214, %int100_4215 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3563 = torch.aten.view %3561, %3562 : !torch.vtensor<[128,1,100],f32>, !torch.list -> !torch.vtensor<[4,32,1,100],f32> %int1_4216 = torch.constant.int 1 %int2_4217 = torch.constant.int 2 %3564 = torch.aten.transpose.int %3563, %int1_4216, %int2_4217 : !torch.vtensor<[4,32,1,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,1,32,100],f32> %int4_4218 = torch.constant.int 4 %int1_4219 = torch.constant.int 1 %int-1_4220 = torch.constant.int -1 %3565 = torch.prim.ListConstruct %int4_4218, %int1_4219, %int-1_4220 : (!torch.int, !torch.int, !torch.int) -> !torch.list %3566 = 
torch.aten.view %3564, %3565 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,3200],f32> %3567 = torch_c.to_builtin_tensor %3566 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_4221 = tensor.cast %3567 : tensor<4x1x3200xf32> to tensor %3568 = torch_c.to_builtin_tensor %96 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %3569 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_4221, %3568) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_4222 = tensor.cast %3569 : tensor to tensor<4x1x3200xf32> %3570 = torch_c.from_builtin_tensor %cast_4222 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int1_4223 = torch.constant.int 1 %3571 = torch.aten.add.Tensor %3328, %3570, %int1_4223 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_4224 = torch.constant.int 2 %3572 = torch.aten.pow.Tensor_Scalar %3571, %int2_4224 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_4225 = torch.constant.int -1 %3573 = torch.prim.ListConstruct %int-1_4225 : (!torch.int) -> !torch.list %true_4226 = torch.constant.bool true %none_4227 = torch.constant.none %3574 = torch.aten.mean.dim %3572, %3573, %true_4226, %none_4227 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_4228 = torch.constant.float 9.9999999747524271E-7 %int1_4229 = torch.constant.int 1 %3575 = torch.aten.add.Scalar %3574, %float9.999990e-07_4228, %int1_4229 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %3576 = torch.aten.rsqrt %3575 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %3577 = torch.aten.mul.Tensor %3571, %3576 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %3578 = torch.aten.mul.Tensor %3577, %97 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> 
!torch.vtensor<[4,1,3200],f32> %3579 = torch_c.to_builtin_tensor %3578 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_4230 = tensor.cast %3579 : tensor<4x1x3200xf32> to tensor %3580 = torch_c.to_builtin_tensor %98 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %3581 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_4230, %3580) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_4231 = tensor.cast %3581 : tensor to tensor<4x1x8640xf32> %3582 = torch_c.from_builtin_tensor %cast_4231 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %3583 = torch.aten.silu %3582 : !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32> %3584 = torch_c.to_builtin_tensor %3578 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_4232 = tensor.cast %3584 : tensor<4x1x3200xf32> to tensor %3585 = torch_c.to_builtin_tensor %99 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %3586 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_4232, %3585) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_4233 = tensor.cast %3586 : tensor to tensor<4x1x8640xf32> %3587 = torch_c.from_builtin_tensor %cast_4233 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %3588 = torch.aten.mul.Tensor %3583, %3587 : !torch.vtensor<[4,1,8640],f32>, !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32> %3589 = torch_c.to_builtin_tensor %3588 : !torch.vtensor<[4,1,8640],f32> -> tensor<4x1x8640xf32> %cast_4234 = tensor.cast %3589 : tensor<4x1x8640xf32> to tensor %3590 = torch_c.to_builtin_tensor %100 : !torch.vtensor<[3200,8640],f16> -> tensor<3200x8640xf16> %3591 = util.call @sharktank_mmtfp_3d_3200_8640_f32f16f32(%cast_4234, %3590) : (tensor, tensor<3200x8640xf16>) -> tensor %cast_4235 = tensor.cast %3591 : tensor to tensor<4x1x3200xf32> %3592 = torch_c.from_builtin_tensor %cast_4235 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int1_4236 = torch.constant.int 1 %3593 = torch.aten.add.Tensor %3571, %3592, 
%int1_4236 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_4237 = torch.constant.int 2 %3594 = torch.aten.pow.Tensor_Scalar %3593, %int2_4237 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_4238 = torch.constant.int -1 %3595 = torch.prim.ListConstruct %int-1_4238 : (!torch.int) -> !torch.list %true_4239 = torch.constant.bool true %none_4240 = torch.constant.none %3596 = torch.aten.mean.dim %3594, %3595, %true_4239, %none_4240 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_4241 = torch.constant.float 9.9999999747524271E-7 %int1_4242 = torch.constant.int 1 %3597 = torch.aten.add.Scalar %3596, %float9.999990e-07_4241, %int1_4242 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %3598 = torch.aten.rsqrt %3597 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %3599 = torch.aten.mul.Tensor %3593, %3598 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %3600 = torch.aten.mul.Tensor %3599, %101 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %3601 = torch_c.to_builtin_tensor %3600 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_4243 = tensor.cast %3601 : tensor<4x1x3200xf32> to tensor %3602 = torch_c.to_builtin_tensor %102 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %3603 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_4243, %3602) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_4244 = tensor.cast %3603 : tensor to tensor<4x1x3200xf32> %3604 = torch_c.from_builtin_tensor %cast_4244 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %3605 = torch_c.to_builtin_tensor %3600 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_4245 = tensor.cast %3605 : tensor<4x1x3200xf32> to tensor %3606 = 
torch_c.to_builtin_tensor %103 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %3607 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_4245, %3606) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_4246 = tensor.cast %3607 : tensor to tensor<4x1x3200xf32> %3608 = torch_c.from_builtin_tensor %cast_4246 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %3609 = torch_c.to_builtin_tensor %3600 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_4247 = tensor.cast %3609 : tensor<4x1x3200xf32> to tensor %3610 = torch_c.to_builtin_tensor %104 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %3611 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_4247, %3610) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_4248 = tensor.cast %3611 : tensor to tensor<4x1x3200xf32> %3612 = torch_c.from_builtin_tensor %cast_4248 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int4_4249 = torch.constant.int 4 %int1_4250 = torch.constant.int 1 %int32_4251 = torch.constant.int 32 %int100_4252 = torch.constant.int 100 %3613 = torch.prim.ListConstruct %int4_4249, %int1_4250, %int32_4251, %int100_4252 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3614 = torch.aten.view %3604, %3613 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_4253 = torch.constant.int 4 %int1_4254 = torch.constant.int 1 %int32_4255 = torch.constant.int 32 %int100_4256 = torch.constant.int 100 %3615 = torch.prim.ListConstruct %int4_4253, %int1_4254, %int32_4255, %int100_4256 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3616 = torch.aten.view %3608, %3615 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_4257 = torch.constant.int 4 %int1_4258 = torch.constant.int 1 %int32_4259 = torch.constant.int 32 %int100_4260 = torch.constant.int 100 %3617 = torch.prim.ListConstruct %int4_4257, %int1_4258, %int32_4259, %int100_4260 : (!torch.int, !torch.int, 
!torch.int, !torch.int) -> !torch.list %3618 = torch.aten.view %3612, %3617 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_4261 = torch.constant.int 4 %int1_4262 = torch.constant.int 1 %int32_4263 = torch.constant.int 32 %int-1_4264 = torch.constant.int -1 %int2_4265 = torch.constant.int 2 %3619 = torch.prim.ListConstruct %int4_4261, %int1_4262, %int32_4263, %int-1_4264, %int2_4265 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3620 = torch.aten.view %3614, %3619 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %3621 = torch.aten.view_as_complex %3620 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %int4_4266 = torch.constant.int 4 %int1_4267 = torch.constant.int 1 %int32_4268 = torch.constant.int 32 %int-1_4269 = torch.constant.int -1 %int2_4270 = torch.constant.int 2 %3622 = torch.prim.ListConstruct %int4_4266, %int1_4267, %int32_4268, %int-1_4269, %int2_4270 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3623 = torch.aten.view %3616, %3622 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %3624 = torch.aten.view_as_complex %3623 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %3625 = torch.aten.mul.Tensor %3621, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %3626 = torch.aten.view_as_real %3625 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_4271 = torch.constant.int 4 %int1_4272 = torch.constant.int 1 %int32_4273 = torch.constant.int 32 %int100_4274 = torch.constant.int 100 %3627 = torch.prim.ListConstruct %int4_4271, %int1_4272, %int32_4273, %int100_4274 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3628 = torch.aten.view %3626, %3627 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> 
!torch.vtensor<[4,1,32,100],f32> %3629 = torch.aten.mul.Tensor %3624, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %3630 = torch.aten.view_as_real %3629 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_4275 = torch.constant.int 4 %int1_4276 = torch.constant.int 1 %int32_4277 = torch.constant.int 32 %int100_4278 = torch.constant.int 100 %3631 = torch.prim.ListConstruct %int4_4275, %int1_4276, %int32_4277, %int100_4278 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3632 = torch.aten.view %3630, %3631 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int1_4279 = torch.constant.int 1 %int1_4280 = torch.constant.int 1 %3633 = torch.aten.add.Scalar %arg2, %int1_4279, %int1_4280 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[4],si64> %int0_4281 = torch.constant.int 0 %int0_4282 = torch.constant.int 0 %3634 = torch.aten.select.int %3633, %int0_4281, %int0_4282 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_4283 = torch.constant.int 0 %int0_4284 = torch.constant.int 0 %3635 = torch.aten.select.int %arg3, %int0_4283, %int0_4284 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_4285 = torch.constant.int 0 %int0_4286 = torch.constant.int 0 %int9223372036854775807_4287 = torch.constant.int 9223372036854775807 %int1_4288 = torch.constant.int 1 %3636 = torch.aten.slice.Tensor %3635, %int0_4285, %int0_4286, %int9223372036854775807_4287, %int1_4288 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_4289 = torch.constant.int 16 %3637 = torch.aten.floor_divide.Scalar %3634, %int16_4289 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_4290 = torch.constant.int 0 %3638 = torch.aten.index_select %3636, %int0_4290, %3637 : !torch.vtensor<[?],si64>, 
!torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_4291 = torch.constant.int 16 %3639 = torch.aten.remainder.Scalar %3634, %int16_4291 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_4292 = torch.constant.none %3640 = torch.aten.clone %414, %none_4292 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_4293 = torch.constant.none %3641 = torch.aten.clone %415, %none_4293 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_4294 = torch.constant.int 0 %3642 = torch.aten.unsqueeze %3639, %int0_4294 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_4295 = torch.constant.int 0 %int0_4296 = torch.constant.int 0 %3643 = torch.aten.select.int %3632, %int0_4295, %int0_4296 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_4297 = torch.constant.int 0 %int0_4298 = torch.constant.int 0 %3644 = torch.aten.select.int %3643, %int0_4297, %int0_4298 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %int-1_4299 = torch.constant.int -1 %int26_4300 = torch.constant.int 26 %int2_4301 = torch.constant.int 2 %int16_4302 = torch.constant.int 16 %int32_4303 = torch.constant.int 32 %int100_4304 = torch.constant.int 100 %3645 = torch.prim.ListConstruct %int-1_4299, %int26_4300, %int2_4301, %int16_4302, %int32_4303, %int100_4304 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3646 = torch.aten.view %3480, %3645 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %3647 = torch.prim.ListConstruct %3638, %3640, %3641, %3642 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_4305 = torch.constant.bool false %3648 = torch.aten.index_put %3646, %3647, %3644, %false_4305 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, 
!torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_4306 = torch.constant.int 2662400 %3649 = torch.prim.ListConstruct %731, %int2662400_4306 : (!torch.int, !torch.int) -> !torch.list %3650 = torch.aten.view %3648, %3649 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_4307 = torch.constant.int -1 %int26_4308 = torch.constant.int 26 %int2_4309 = torch.constant.int 2 %int16_4310 = torch.constant.int 16 %int32_4311 = torch.constant.int 32 %int100_4312 = torch.constant.int 100 %3651 = torch.prim.ListConstruct %int-1_4307, %int26_4308, %int2_4309, %int16_4310, %int32_4311, %int100_4312 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3652 = torch.aten.view %3650, %3651 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_4313 = torch.constant.none %3653 = torch.aten.clone %416, %none_4313 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_4314 = torch.constant.none %3654 = torch.aten.clone %417, %none_4314 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_4315 = torch.constant.int 0 %3655 = torch.aten.unsqueeze %3639, %int0_4315 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_4316 = torch.constant.int 0 %int0_4317 = torch.constant.int 0 %3656 = torch.aten.select.int %3618, %int0_4316, %int0_4317 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_4318 = torch.constant.int 0 %int0_4319 = torch.constant.int 0 %3657 = torch.aten.select.int %3656, %int0_4318, %int0_4319 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %3658 = torch.prim.ListConstruct %3638, %3653, %3654, %3655 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_4320 = torch.constant.bool false %3659 = 
torch.aten.index_put %3652, %3658, %3657, %false_4320 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_4321 = torch.constant.int 2662400 %3660 = torch.prim.ListConstruct %731, %int2662400_4321 : (!torch.int, !torch.int) -> !torch.list %3661 = torch.aten.view %3659, %3660 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_4322 = torch.constant.int -1 %int26_4323 = torch.constant.int 26 %int2_4324 = torch.constant.int 2 %int16_4325 = torch.constant.int 16 %int32_4326 = torch.constant.int 32 %int100_4327 = torch.constant.int 100 %3662 = torch.prim.ListConstruct %int-1_4322, %int26_4323, %int2_4324, %int16_4325, %int32_4326, %int100_4327 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3663 = torch.aten.view %3661, %3662 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_4328 = torch.constant.int 0 %int1_4329 = torch.constant.int 1 %3664 = torch.aten.select.int %3633, %int0_4328, %int1_4329 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_4330 = torch.constant.int 0 %int1_4331 = torch.constant.int 1 %3665 = torch.aten.select.int %arg3, %int0_4330, %int1_4331 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_4332 = torch.constant.int 0 %int0_4333 = torch.constant.int 0 %int9223372036854775807_4334 = torch.constant.int 9223372036854775807 %int1_4335 = torch.constant.int 1 %3666 = torch.aten.slice.Tensor %3665, %int0_4332, %int0_4333, %int9223372036854775807_4334, %int1_4335 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_4336 = torch.constant.int 16 %3667 = torch.aten.floor_divide.Scalar %3664, %int16_4336 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_4337 = torch.constant.int 0 %3668 
= torch.aten.index_select %3666, %int0_4337, %3667 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_4338 = torch.constant.int 16 %3669 = torch.aten.remainder.Scalar %3664, %int16_4338 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_4339 = torch.constant.none %3670 = torch.aten.clone %418, %none_4339 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_4340 = torch.constant.none %3671 = torch.aten.clone %419, %none_4340 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_4341 = torch.constant.int 0 %3672 = torch.aten.unsqueeze %3669, %int0_4341 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_4342 = torch.constant.int 0 %int1_4343 = torch.constant.int 1 %3673 = torch.aten.select.int %3632, %int0_4342, %int1_4343 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_4344 = torch.constant.int 0 %int0_4345 = torch.constant.int 0 %3674 = torch.aten.select.int %3673, %int0_4344, %int0_4345 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %3675 = torch.prim.ListConstruct %3668, %3670, %3671, %3672 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_4346 = torch.constant.bool false %3676 = torch.aten.index_put %3663, %3675, %3674, %false_4346 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_4347 = torch.constant.int 2662400 %3677 = torch.prim.ListConstruct %731, %int2662400_4347 : (!torch.int, !torch.int) -> !torch.list %3678 = torch.aten.view %3676, %3677 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_4348 = torch.constant.int -1 %int26_4349 = torch.constant.int 26 %int2_4350 = torch.constant.int 2 %int16_4351 = 
torch.constant.int 16 %int32_4352 = torch.constant.int 32 %int100_4353 = torch.constant.int 100 %3679 = torch.prim.ListConstruct %int-1_4348, %int26_4349, %int2_4350, %int16_4351, %int32_4352, %int100_4353 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3680 = torch.aten.view %3678, %3679 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_4354 = torch.constant.none %3681 = torch.aten.clone %420, %none_4354 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_4355 = torch.constant.none %3682 = torch.aten.clone %421, %none_4355 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_4356 = torch.constant.int 0 %3683 = torch.aten.unsqueeze %3669, %int0_4356 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_4357 = torch.constant.int 0 %int1_4358 = torch.constant.int 1 %3684 = torch.aten.select.int %3618, %int0_4357, %int1_4358 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_4359 = torch.constant.int 0 %int0_4360 = torch.constant.int 0 %3685 = torch.aten.select.int %3684, %int0_4359, %int0_4360 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %3686 = torch.prim.ListConstruct %3668, %3681, %3682, %3683 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_4361 = torch.constant.bool false %3687 = torch.aten.index_put %3680, %3686, %3685, %false_4361 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_4362 = torch.constant.int 2662400 %3688 = torch.prim.ListConstruct %731, %int2662400_4362 : (!torch.int, !torch.int) -> !torch.list %3689 = torch.aten.view %3687, %3688 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_4363 
= torch.constant.int -1 %int26_4364 = torch.constant.int 26 %int2_4365 = torch.constant.int 2 %int16_4366 = torch.constant.int 16 %int32_4367 = torch.constant.int 32 %int100_4368 = torch.constant.int 100 %3690 = torch.prim.ListConstruct %int-1_4363, %int26_4364, %int2_4365, %int16_4366, %int32_4367, %int100_4368 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3691 = torch.aten.view %3689, %3690 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_4369 = torch.constant.int 0 %int2_4370 = torch.constant.int 2 %3692 = torch.aten.select.int %3633, %int0_4369, %int2_4370 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_4371 = torch.constant.int 0 %int2_4372 = torch.constant.int 2 %3693 = torch.aten.select.int %arg3, %int0_4371, %int2_4372 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_4373 = torch.constant.int 0 %int0_4374 = torch.constant.int 0 %int9223372036854775807_4375 = torch.constant.int 9223372036854775807 %int1_4376 = torch.constant.int 1 %3694 = torch.aten.slice.Tensor %3693, %int0_4373, %int0_4374, %int9223372036854775807_4375, %int1_4376 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_4377 = torch.constant.int 16 %3695 = torch.aten.floor_divide.Scalar %3692, %int16_4377 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_4378 = torch.constant.int 0 %3696 = torch.aten.index_select %3694, %int0_4378, %3695 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_4379 = torch.constant.int 16 %3697 = torch.aten.remainder.Scalar %3692, %int16_4379 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_4380 = torch.constant.none %3698 = torch.aten.clone %422, %none_4380 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_4381 = torch.constant.none 
%3699 = torch.aten.clone %423, %none_4381 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_4382 = torch.constant.int 0 %3700 = torch.aten.unsqueeze %3697, %int0_4382 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_4383 = torch.constant.int 0 %int2_4384 = torch.constant.int 2 %3701 = torch.aten.select.int %3632, %int0_4383, %int2_4384 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_4385 = torch.constant.int 0 %int0_4386 = torch.constant.int 0 %3702 = torch.aten.select.int %3701, %int0_4385, %int0_4386 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %3703 = torch.prim.ListConstruct %3696, %3698, %3699, %3700 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_4387 = torch.constant.bool false %3704 = torch.aten.index_put %3691, %3703, %3702, %false_4387 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_4388 = torch.constant.int 2662400 %3705 = torch.prim.ListConstruct %731, %int2662400_4388 : (!torch.int, !torch.int) -> !torch.list %3706 = torch.aten.view %3704, %3705 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_4389 = torch.constant.int -1 %int26_4390 = torch.constant.int 26 %int2_4391 = torch.constant.int 2 %int16_4392 = torch.constant.int 16 %int32_4393 = torch.constant.int 32 %int100_4394 = torch.constant.int 100 %3707 = torch.prim.ListConstruct %int-1_4389, %int26_4390, %int2_4391, %int16_4392, %int32_4393, %int100_4394 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3708 = torch.aten.view %3706, %3707 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_4395 = torch.constant.none %3709 = torch.aten.clone %424, 
%none_4395 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_4396 = torch.constant.none %3710 = torch.aten.clone %425, %none_4396 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_4397 = torch.constant.int 0 %3711 = torch.aten.unsqueeze %3697, %int0_4397 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_4398 = torch.constant.int 0 %int2_4399 = torch.constant.int 2 %3712 = torch.aten.select.int %3618, %int0_4398, %int2_4399 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_4400 = torch.constant.int 0 %int0_4401 = torch.constant.int 0 %3713 = torch.aten.select.int %3712, %int0_4400, %int0_4401 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %3714 = torch.prim.ListConstruct %3696, %3709, %3710, %3711 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_4402 = torch.constant.bool false %3715 = torch.aten.index_put %3708, %3714, %3713, %false_4402 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_4403 = torch.constant.int 2662400 %3716 = torch.prim.ListConstruct %731, %int2662400_4403 : (!torch.int, !torch.int) -> !torch.list %3717 = torch.aten.view %3715, %3716 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_4404 = torch.constant.int -1 %int26_4405 = torch.constant.int 26 %int2_4406 = torch.constant.int 2 %int16_4407 = torch.constant.int 16 %int32_4408 = torch.constant.int 32 %int100_4409 = torch.constant.int 100 %3718 = torch.prim.ListConstruct %int-1_4404, %int26_4405, %int2_4406, %int16_4407, %int32_4408, %int100_4409 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3719 = torch.aten.view %3717, %3718 : !torch.vtensor<[?,2662400],f32>, 
!torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_4410 = torch.constant.int 0 %int3_4411 = torch.constant.int 3 %3720 = torch.aten.select.int %3633, %int0_4410, %int3_4411 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_4412 = torch.constant.int 0 %int3_4413 = torch.constant.int 3 %3721 = torch.aten.select.int %arg3, %int0_4412, %int3_4413 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_4414 = torch.constant.int 0 %int0_4415 = torch.constant.int 0 %int9223372036854775807_4416 = torch.constant.int 9223372036854775807 %int1_4417 = torch.constant.int 1 %3722 = torch.aten.slice.Tensor %3721, %int0_4414, %int0_4415, %int9223372036854775807_4416, %int1_4417 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_4418 = torch.constant.int 16 %3723 = torch.aten.floor_divide.Scalar %3720, %int16_4418 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_4419 = torch.constant.int 0 %3724 = torch.aten.index_select %3722, %int0_4419, %3723 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_4420 = torch.constant.int 16 %3725 = torch.aten.remainder.Scalar %3720, %int16_4420 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_4421 = torch.constant.none %3726 = torch.aten.clone %426, %none_4421 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_4422 = torch.constant.none %3727 = torch.aten.clone %427, %none_4422 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_4423 = torch.constant.int 0 %3728 = torch.aten.unsqueeze %3725, %int0_4423 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_4424 = torch.constant.int 0 %int3_4425 = torch.constant.int 3 %3729 = torch.aten.select.int %3632, %int0_4424, %int3_4425 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> 
%int0_4426 = torch.constant.int 0 %int0_4427 = torch.constant.int 0 %3730 = torch.aten.select.int %3729, %int0_4426, %int0_4427 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %3731 = torch.prim.ListConstruct %3724, %3726, %3727, %3728 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_4428 = torch.constant.bool false %3732 = torch.aten.index_put %3719, %3731, %3730, %false_4428 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_4429 = torch.constant.int 2662400 %3733 = torch.prim.ListConstruct %731, %int2662400_4429 : (!torch.int, !torch.int) -> !torch.list %3734 = torch.aten.view %3732, %3733 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_4430 = torch.constant.int -1 %int26_4431 = torch.constant.int 26 %int2_4432 = torch.constant.int 2 %int16_4433 = torch.constant.int 16 %int32_4434 = torch.constant.int 32 %int100_4435 = torch.constant.int 100 %3735 = torch.prim.ListConstruct %int-1_4430, %int26_4431, %int2_4432, %int16_4433, %int32_4434, %int100_4435 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3736 = torch.aten.view %3734, %3735 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_4436 = torch.constant.none %3737 = torch.aten.clone %428, %none_4436 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_4437 = torch.constant.none %3738 = torch.aten.clone %429, %none_4437 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_4438 = torch.constant.int 0 %3739 = torch.aten.unsqueeze %3725, %int0_4438 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_4439 = torch.constant.int 0 %int3_4440 = torch.constant.int 3 %3740 = torch.aten.select.int %3618, 
%int0_4439, %int3_4440 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_4441 = torch.constant.int 0 %int0_4442 = torch.constant.int 0 %3741 = torch.aten.select.int %3740, %int0_4441, %int0_4442 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %3742 = torch.prim.ListConstruct %3724, %3737, %3738, %3739 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_4443 = torch.constant.bool false %3743 = torch.aten.index_put %3736, %3742, %3741, %false_4443 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_4444 = torch.constant.int 2662400 %3744 = torch.prim.ListConstruct %731, %int2662400_4444 : (!torch.int, !torch.int) -> !torch.list %3745 = torch.aten.view %3743, %3744 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int52_4445 = torch.constant.int 52 %3746 = torch.aten.mul.Scalar %arg3, %int52_4445 : !torch.vtensor<[4,?],si64>, !torch.int -> !torch.vtensor<[4,?],si64> %int22 = torch.constant.int 22 %int1_4446 = torch.constant.int 1 %3747 = torch.aten.add.Scalar %3746, %int22, %int1_4446 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_4447 = torch.constant.int 4 %3748 = torch.aten.mul.int %int4_4447, %655 : !torch.int, !torch.int -> !torch.int %3749 = torch.prim.ListConstruct %3748 : (!torch.int) -> !torch.list %3750 = torch.aten.view %3747, %3749 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int-1_4448 = torch.constant.int -1 %int26_4449 = torch.constant.int 26 %int2_4450 = torch.constant.int 2 %int16_4451 = torch.constant.int 16 %int32_4452 = torch.constant.int 32 %int100_4453 = torch.constant.int 100 %3751 = torch.prim.ListConstruct %int-1_4448, %int26_4449, %int2_4450, %int16_4451, %int32_4452, 
%int100_4453 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3752 = torch.aten.view %3745, %3751 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int26_4454 = torch.constant.int 26 %3753 = torch.aten.mul.int %731, %int26_4454 : !torch.int, !torch.int -> !torch.int %int2_4455 = torch.constant.int 2 %3754 = torch.aten.mul.int %3753, %int2_4455 : !torch.int, !torch.int -> !torch.int %int16_4456 = torch.constant.int 16 %int32_4457 = torch.constant.int 32 %int100_4458 = torch.constant.int 100 %3755 = torch.prim.ListConstruct %3754, %int16_4456, %int32_4457, %int100_4458 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3756 = torch.aten.view %3752, %3755 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,16,32,100],f32> %int0_4459 = torch.constant.int 0 %3757 = torch.aten.index_select %3756, %int0_4459, %3750 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_4460 = torch.constant.int 4 %int16_4461 = torch.constant.int 16 %int32_4462 = torch.constant.int 32 %int100_4463 = torch.constant.int 100 %3758 = torch.prim.ListConstruct %int4_4460, %655, %int16_4461, %int32_4462, %int100_4463 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3759 = torch.aten.view %3757, %3758 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_4464 = torch.constant.int 1 %3760 = torch.aten.size.int %3759, %int1_4464 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_4465 = torch.constant.int 16 %3761 = torch.aten.mul.int %3760, %int16_4465 : !torch.int, !torch.int -> !torch.int %int4_4466 = torch.constant.int 4 %int32_4467 = torch.constant.int 32 %int100_4468 = torch.constant.int 100 %3762 = torch.prim.ListConstruct %int4_4466, %3761, %int32_4467, %int100_4468 : (!torch.int, !torch.int, !torch.int, !torch.int) -> 
!torch.list %3763 = torch.aten.view %3759, %3762 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_4469 = torch.constant.int 0 %int0_4470 = torch.constant.int 0 %int9223372036854775807_4471 = torch.constant.int 9223372036854775807 %int1_4472 = torch.constant.int 1 %3764 = torch.aten.slice.Tensor %3505, %int0_4469, %int0_4470, %int9223372036854775807_4471, %int1_4472 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int16_4473 = torch.constant.int 16 %3765 = torch.aten.mul.int %655, %int16_4473 : !torch.int, !torch.int -> !torch.int %int1_4474 = torch.constant.int 1 %int0_4475 = torch.constant.int 0 %int1_4476 = torch.constant.int 1 %3766 = torch.aten.slice.Tensor %3764, %int1_4474, %int0_4475, %3765, %int1_4476 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_4477 = torch.constant.bool false %3767 = torch.aten.copy %3766, %3763, %false_4477 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_4478 = torch.constant.int 0 %int0_4479 = torch.constant.int 0 %int9223372036854775807_4480 = torch.constant.int 9223372036854775807 %int1_4481 = torch.constant.int 1 %3768 = torch.aten.slice.Tensor %3505, %int0_4478, %int0_4479, %int9223372036854775807_4480, %int1_4481 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_4482 = torch.constant.int 1 %int0_4483 = torch.constant.int 0 %int1_4484 = torch.constant.int 1 %3769 = torch.aten.slice_scatter %3768, %3767, %int1_4482, %int0_4483, %3765, %int1_4484 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_4485 = torch.constant.int 0 %int0_4486 = torch.constant.int 0 
%int9223372036854775807_4487 = torch.constant.int 9223372036854775807 %int1_4488 = torch.constant.int 1 %3770 = torch.aten.slice_scatter %3505, %3769, %int0_4485, %int0_4486, %int9223372036854775807_4487, %int1_4488 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_4489 = torch.constant.int 1 %int1_4490 = torch.constant.int 1 %3771 = torch.aten.add.Scalar %3747, %int1_4489, %int1_4490 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_4491 = torch.constant.int 4 %3772 = torch.aten.mul.int %int4_4491, %655 : !torch.int, !torch.int -> !torch.int %3773 = torch.prim.ListConstruct %3772 : (!torch.int) -> !torch.list %3774 = torch.aten.view %3771, %3773 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int0_4492 = torch.constant.int 0 %3775 = torch.aten.index_select %3756, %int0_4492, %3774 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_4493 = torch.constant.int 4 %int16_4494 = torch.constant.int 16 %int32_4495 = torch.constant.int 32 %int100_4496 = torch.constant.int 100 %3776 = torch.prim.ListConstruct %int4_4493, %655, %int16_4494, %int32_4495, %int100_4496 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3777 = torch.aten.view %3775, %3776 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_4497 = torch.constant.int 1 %3778 = torch.aten.size.int %3777, %int1_4497 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_4498 = torch.constant.int 16 %3779 = torch.aten.mul.int %3778, %int16_4498 : !torch.int, !torch.int -> !torch.int %int4_4499 = torch.constant.int 4 %int32_4500 = torch.constant.int 32 %int100_4501 = torch.constant.int 100 %3780 = torch.prim.ListConstruct %int4_4499, %3779, %int32_4500, %int100_4501 : (!torch.int, !torch.int, 
!torch.int, !torch.int) -> !torch.list %3781 = torch.aten.view %3777, %3780 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_4502 = torch.constant.int 0 %int0_4503 = torch.constant.int 0 %int9223372036854775807_4504 = torch.constant.int 9223372036854775807 %int1_4505 = torch.constant.int 1 %3782 = torch.aten.slice.Tensor %3522, %int0_4502, %int0_4503, %int9223372036854775807_4504, %int1_4505 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_4506 = torch.constant.int 1 %int0_4507 = torch.constant.int 0 %int1_4508 = torch.constant.int 1 %3783 = torch.aten.slice.Tensor %3782, %int1_4506, %int0_4507, %3765, %int1_4508 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_4509 = torch.constant.bool false %3784 = torch.aten.copy %3783, %3781, %false_4509 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_4510 = torch.constant.int 0 %int0_4511 = torch.constant.int 0 %int9223372036854775807_4512 = torch.constant.int 9223372036854775807 %int1_4513 = torch.constant.int 1 %3785 = torch.aten.slice.Tensor %3522, %int0_4510, %int0_4511, %int9223372036854775807_4512, %int1_4513 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_4514 = torch.constant.int 1 %int0_4515 = torch.constant.int 0 %int1_4516 = torch.constant.int 1 %3786 = torch.aten.slice_scatter %3785, %3784, %int1_4514, %int0_4515, %3765, %int1_4516 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_4517 = torch.constant.int 0 %int0_4518 = torch.constant.int 0 %int9223372036854775807_4519 = torch.constant.int 9223372036854775807 %int1_4520 = torch.constant.int 1 
%3787 = torch.aten.slice_scatter %3522, %3786, %int0_4517, %int0_4518, %int9223372036854775807_4519, %int1_4520 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_4521 = torch.constant.int 0 %int0_4522 = torch.constant.int 0 %int9223372036854775807_4523 = torch.constant.int 9223372036854775807 %int1_4524 = torch.constant.int 1 %3788 = torch.aten.slice.Tensor %671, %int0_4521, %int0_4522, %int9223372036854775807_4523, %int1_4524 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_4525 = torch.constant.int 1 %int0_4526 = torch.constant.int 0 %int1_4527 = torch.constant.int 1 %3789 = torch.aten.slice.Tensor %3788, %int1_4525, %int0_4526, %3765, %int1_4527 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int0_4528 = torch.constant.int 0 %int0_4529 = torch.constant.int 0 %int9223372036854775807_4530 = torch.constant.int 9223372036854775807 %int1_4531 = torch.constant.int 1 %3790 = torch.aten.slice.Tensor %673, %int0_4528, %int0_4529, %int9223372036854775807_4530, %int1_4531 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_4532 = torch.constant.int 1 %int0_4533 = torch.constant.int 0 %int1_4534 = torch.constant.int 1 %3791 = torch.aten.slice.Tensor %3790, %int1_4532, %int0_4533, %3765, %int1_4534 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_4535 = torch.constant.int 1 %int2_4536 = torch.constant.int 2 %3792 = torch.aten.transpose.int %3628, %int1_4535, %int2_4536 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,1,100],f32> %int4_4537 = torch.constant.int 4 %int32_4538 = torch.constant.int 32 %int1_4539 = 
torch.constant.int 1 %int100_4540 = torch.constant.int 100 %3793 = torch.prim.ListConstruct %int4_4537, %int32_4538, %int1_4539, %int100_4540 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_4541 = torch.constant.bool false %3794 = torch.aten.expand %3792, %3793, %false_4541 : !torch.vtensor<[4,32,1,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,100],f32> %int128_4542 = torch.constant.int 128 %int1_4543 = torch.constant.int 1 %int100_4544 = torch.constant.int 100 %3795 = torch.prim.ListConstruct %int128_4542, %int1_4543, %int100_4544 : (!torch.int, !torch.int, !torch.int) -> !torch.list %3796 = torch.aten.view %3794, %3795 : !torch.vtensor<[4,32,1,100],f32>, !torch.list -> !torch.vtensor<[128,1,100],f32> %int0_4545 = torch.constant.int 0 %int0_4546 = torch.constant.int 0 %int9223372036854775807_4547 = torch.constant.int 9223372036854775807 %int1_4548 = torch.constant.int 1 %3797 = torch.aten.slice.Tensor %3770, %int0_4545, %int0_4546, %int9223372036854775807_4547, %int1_4548 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_4549 = torch.constant.int 1 %int0_4550 = torch.constant.int 0 %int1_4551 = torch.constant.int 1 %3798 = torch.aten.slice.Tensor %3797, %int1_4549, %int0_4550, %3765, %int1_4551 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_4552 = torch.constant.int 1 %int2_4553 = torch.constant.int 2 %3799 = torch.aten.transpose.int %3798, %int1_4552, %int2_4553 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int2_4554 = torch.constant.int 2 %int3_4555 = torch.constant.int 3 %3800 = torch.aten.transpose.int %3799, %int2_4554, %int3_4555 : !torch.vtensor<[4,32,?,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int1_4556 = torch.constant.int 1 %3801 = torch.aten.size.int %3789, %int1_4556 : 
!torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_4557 = torch.constant.int 4 %int32_4558 = torch.constant.int 32 %int100_4559 = torch.constant.int 100 %3802 = torch.prim.ListConstruct %int4_4557, %int32_4558, %int100_4559, %3801 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_4560 = torch.constant.bool false %3803 = torch.aten.expand %3800, %3802, %false_4560 : !torch.vtensor<[4,32,100,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,100,?],f32> %int0_4561 = torch.constant.int 0 %3804 = torch.aten.clone %3803, %int0_4561 : !torch.vtensor<[4,32,100,?],f32>, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int128_4562 = torch.constant.int 128 %int100_4563 = torch.constant.int 100 %3805 = torch.prim.ListConstruct %int128_4562, %int100_4563, %3801 : (!torch.int, !torch.int, !torch.int) -> !torch.list %3806 = torch.aten._unsafe_view %3804, %3805 : !torch.vtensor<[4,32,100,?],f32>, !torch.list -> !torch.vtensor<[128,100,?],f32> %3807 = torch.aten.bmm %3796, %3806 : !torch.vtensor<[128,1,100],f32>, !torch.vtensor<[128,100,?],f32> -> !torch.vtensor<[128,1,?],f32> %int4_4564 = torch.constant.int 4 %int32_4565 = torch.constant.int 32 %int1_4566 = torch.constant.int 1 %3808 = torch.prim.ListConstruct %int4_4564, %int32_4565, %int1_4566, %3801 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3809 = torch.aten.view %3807, %3808 : !torch.vtensor<[128,1,?],f32>, !torch.list -> !torch.vtensor<[4,32,1,?],f32> %float1.000000e01_4567 = torch.constant.float 1.000000e+01 %3810 = torch.aten.div.Scalar %3809, %float1.000000e01_4567 : !torch.vtensor<[4,32,1,?],f32>, !torch.float -> !torch.vtensor<[4,32,1,?],f32> %int1_4568 = torch.constant.int 1 %3811 = torch.aten.add.Tensor %3810, %895, %int1_4568 : !torch.vtensor<[4,32,1,?],f32>, !torch.vtensor<[4,1,1,?],f32>, !torch.int -> !torch.vtensor<[4,32,1,?],f32> %int-1_4569 = torch.constant.int -1 %false_4570 = torch.constant.bool false %3812 = torch.aten._softmax %3811, 
%int-1_4569, %false_4570 : !torch.vtensor<[4,32,1,?],f32>, !torch.int, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int4_4571 = torch.constant.int 4 %int32_4572 = torch.constant.int 32 %int1_4573 = torch.constant.int 1 %3813 = torch.prim.ListConstruct %int4_4571, %int32_4572, %int1_4573, %3801 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_4574 = torch.constant.bool false %3814 = torch.aten.expand %3812, %3813, %false_4574 : !torch.vtensor<[4,32,1,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int128_4575 = torch.constant.int 128 %int1_4576 = torch.constant.int 1 %3815 = torch.prim.ListConstruct %int128_4575, %int1_4576, %3801 : (!torch.int, !torch.int, !torch.int) -> !torch.list %3816 = torch.aten.view %3814, %3815 : !torch.vtensor<[4,32,1,?],f32>, !torch.list -> !torch.vtensor<[128,1,?],f32> %int0_4577 = torch.constant.int 0 %int0_4578 = torch.constant.int 0 %int9223372036854775807_4579 = torch.constant.int 9223372036854775807 %int1_4580 = torch.constant.int 1 %3817 = torch.aten.slice.Tensor %3787, %int0_4577, %int0_4578, %int9223372036854775807_4579, %int1_4580 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_4581 = torch.constant.int 1 %int0_4582 = torch.constant.int 0 %int1_4583 = torch.constant.int 1 %3818 = torch.aten.slice.Tensor %3817, %int1_4581, %int0_4582, %3765, %int1_4583 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_4584 = torch.constant.int 1 %int2_4585 = torch.constant.int 2 %3819 = torch.aten.transpose.int %3818, %int1_4584, %int2_4585 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int1_4586 = torch.constant.int 1 %3820 = torch.aten.size.int %3791, %int1_4586 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_4587 = torch.constant.int 4 %int32_4588 = torch.constant.int 32 
%int100_4589 = torch.constant.int 100 %3821 = torch.prim.ListConstruct %int4_4587, %int32_4588, %3820, %int100_4589 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_4590 = torch.constant.bool false %3822 = torch.aten.expand %3819, %3821, %false_4590 : !torch.vtensor<[4,32,?,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,?,100],f32> %int0_4591 = torch.constant.int 0 %3823 = torch.aten.clone %3822, %int0_4591 : !torch.vtensor<[4,32,?,100],f32>, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int128_4592 = torch.constant.int 128 %int100_4593 = torch.constant.int 100 %3824 = torch.prim.ListConstruct %int128_4592, %3820, %int100_4593 : (!torch.int, !torch.int, !torch.int) -> !torch.list %3825 = torch.aten._unsafe_view %3823, %3824 : !torch.vtensor<[4,32,?,100],f32>, !torch.list -> !torch.vtensor<[128,?,100],f32> %3826 = torch.aten.bmm %3816, %3825 : !torch.vtensor<[128,1,?],f32>, !torch.vtensor<[128,?,100],f32> -> !torch.vtensor<[128,1,100],f32> %int4_4594 = torch.constant.int 4 %int32_4595 = torch.constant.int 32 %int1_4596 = torch.constant.int 1 %int100_4597 = torch.constant.int 100 %3827 = torch.prim.ListConstruct %int4_4594, %int32_4595, %int1_4596, %int100_4597 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3828 = torch.aten.view %3826, %3827 : !torch.vtensor<[128,1,100],f32>, !torch.list -> !torch.vtensor<[4,32,1,100],f32> %int1_4598 = torch.constant.int 1 %int2_4599 = torch.constant.int 2 %3829 = torch.aten.transpose.int %3828, %int1_4598, %int2_4599 : !torch.vtensor<[4,32,1,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,1,32,100],f32> %int4_4600 = torch.constant.int 4 %int1_4601 = torch.constant.int 1 %int-1_4602 = torch.constant.int -1 %3830 = torch.prim.ListConstruct %int4_4600, %int1_4601, %int-1_4602 : (!torch.int, !torch.int, !torch.int) -> !torch.list %3831 = torch.aten.view %3829, %3830 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,3200],f32> %3832 = 
torch_c.to_builtin_tensor %3831 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_4603 = tensor.cast %3832 : tensor<4x1x3200xf32> to tensor %3833 = torch_c.to_builtin_tensor %105 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %3834 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_4603, %3833) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_4604 = tensor.cast %3834 : tensor to tensor<4x1x3200xf32> %3835 = torch_c.from_builtin_tensor %cast_4604 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int1_4605 = torch.constant.int 1 %3836 = torch.aten.add.Tensor %3593, %3835, %int1_4605 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_4606 = torch.constant.int 2 %3837 = torch.aten.pow.Tensor_Scalar %3836, %int2_4606 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_4607 = torch.constant.int -1 %3838 = torch.prim.ListConstruct %int-1_4607 : (!torch.int) -> !torch.list %true_4608 = torch.constant.bool true %none_4609 = torch.constant.none %3839 = torch.aten.mean.dim %3837, %3838, %true_4608, %none_4609 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_4610 = torch.constant.float 9.9999999747524271E-7 %int1_4611 = torch.constant.int 1 %3840 = torch.aten.add.Scalar %3839, %float9.999990e-07_4610, %int1_4611 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %3841 = torch.aten.rsqrt %3840 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %3842 = torch.aten.mul.Tensor %3836, %3841 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %3843 = torch.aten.mul.Tensor %3842, %106 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %3844 = torch_c.to_builtin_tensor %3843 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_4612 = 
tensor.cast %3844 : tensor<4x1x3200xf32> to tensor %3845 = torch_c.to_builtin_tensor %107 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %3846 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_4612, %3845) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_4613 = tensor.cast %3846 : tensor to tensor<4x1x8640xf32> %3847 = torch_c.from_builtin_tensor %cast_4613 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %3848 = torch.aten.silu %3847 : !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32> %3849 = torch_c.to_builtin_tensor %3843 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_4614 = tensor.cast %3849 : tensor<4x1x3200xf32> to tensor %3850 = torch_c.to_builtin_tensor %108 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %3851 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_4614, %3850) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_4615 = tensor.cast %3851 : tensor to tensor<4x1x8640xf32> %3852 = torch_c.from_builtin_tensor %cast_4615 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %3853 = torch.aten.mul.Tensor %3848, %3852 : !torch.vtensor<[4,1,8640],f32>, !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32> %3854 = torch_c.to_builtin_tensor %3853 : !torch.vtensor<[4,1,8640],f32> -> tensor<4x1x8640xf32> %cast_4616 = tensor.cast %3854 : tensor<4x1x8640xf32> to tensor %3855 = torch_c.to_builtin_tensor %109 : !torch.vtensor<[3200,8640],f16> -> tensor<3200x8640xf16> %3856 = util.call @sharktank_mmtfp_3d_3200_8640_f32f16f32(%cast_4616, %3855) : (tensor, tensor<3200x8640xf16>) -> tensor %cast_4617 = tensor.cast %3856 : tensor to tensor<4x1x3200xf32> %3857 = torch_c.from_builtin_tensor %cast_4617 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int1_4618 = torch.constant.int 1 %3858 = torch.aten.add.Tensor %3836, %3857, %int1_4618 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_4619 = 
torch.constant.int 2 %3859 = torch.aten.pow.Tensor_Scalar %3858, %int2_4619 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_4620 = torch.constant.int -1 %3860 = torch.prim.ListConstruct %int-1_4620 : (!torch.int) -> !torch.list %true_4621 = torch.constant.bool true %none_4622 = torch.constant.none %3861 = torch.aten.mean.dim %3859, %3860, %true_4621, %none_4622 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_4623 = torch.constant.float 9.9999999747524271E-7 %int1_4624 = torch.constant.int 1 %3862 = torch.aten.add.Scalar %3861, %float9.999990e-07_4623, %int1_4624 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %3863 = torch.aten.rsqrt %3862 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %3864 = torch.aten.mul.Tensor %3858, %3863 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %3865 = torch.aten.mul.Tensor %3864, %110 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %3866 = torch_c.to_builtin_tensor %3865 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_4625 = tensor.cast %3866 : tensor<4x1x3200xf32> to tensor %3867 = torch_c.to_builtin_tensor %111 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %3868 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_4625, %3867) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_4626 = tensor.cast %3868 : tensor to tensor<4x1x3200xf32> %3869 = torch_c.from_builtin_tensor %cast_4626 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %3870 = torch_c.to_builtin_tensor %3865 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_4627 = tensor.cast %3870 : tensor<4x1x3200xf32> to tensor %3871 = torch_c.to_builtin_tensor %112 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %3872 = util.call 
@sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_4627, %3871) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_4628 = tensor.cast %3872 : tensor to tensor<4x1x3200xf32> %3873 = torch_c.from_builtin_tensor %cast_4628 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %3874 = torch_c.to_builtin_tensor %3865 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_4629 = tensor.cast %3874 : tensor<4x1x3200xf32> to tensor %3875 = torch_c.to_builtin_tensor %113 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %3876 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_4629, %3875) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_4630 = tensor.cast %3876 : tensor to tensor<4x1x3200xf32> %3877 = torch_c.from_builtin_tensor %cast_4630 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int4_4631 = torch.constant.int 4 %int1_4632 = torch.constant.int 1 %int32_4633 = torch.constant.int 32 %int100_4634 = torch.constant.int 100 %3878 = torch.prim.ListConstruct %int4_4631, %int1_4632, %int32_4633, %int100_4634 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3879 = torch.aten.view %3869, %3878 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_4635 = torch.constant.int 4 %int1_4636 = torch.constant.int 1 %int32_4637 = torch.constant.int 32 %int100_4638 = torch.constant.int 100 %3880 = torch.prim.ListConstruct %int4_4635, %int1_4636, %int32_4637, %int100_4638 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3881 = torch.aten.view %3873, %3880 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_4639 = torch.constant.int 4 %int1_4640 = torch.constant.int 1 %int32_4641 = torch.constant.int 32 %int100_4642 = torch.constant.int 100 %3882 = torch.prim.ListConstruct %int4_4639, %int1_4640, %int32_4641, %int100_4642 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3883 = torch.aten.view %3877, %3882 : 
!torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_4643 = torch.constant.int 4 %int1_4644 = torch.constant.int 1 %int32_4645 = torch.constant.int 32 %int-1_4646 = torch.constant.int -1 %int2_4647 = torch.constant.int 2 %3884 = torch.prim.ListConstruct %int4_4643, %int1_4644, %int32_4645, %int-1_4646, %int2_4647 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3885 = torch.aten.view %3879, %3884 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %3886 = torch.aten.view_as_complex %3885 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %int4_4648 = torch.constant.int 4 %int1_4649 = torch.constant.int 1 %int32_4650 = torch.constant.int 32 %int-1_4651 = torch.constant.int -1 %int2_4652 = torch.constant.int 2 %3887 = torch.prim.ListConstruct %int4_4648, %int1_4649, %int32_4650, %int-1_4651, %int2_4652 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3888 = torch.aten.view %3881, %3887 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %3889 = torch.aten.view_as_complex %3888 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %3890 = torch.aten.mul.Tensor %3886, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %3891 = torch.aten.view_as_real %3890 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_4653 = torch.constant.int 4 %int1_4654 = torch.constant.int 1 %int32_4655 = torch.constant.int 32 %int100_4656 = torch.constant.int 100 %3892 = torch.prim.ListConstruct %int4_4653, %int1_4654, %int32_4655, %int100_4656 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3893 = torch.aten.view %3891, %3892 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %3894 = torch.aten.mul.Tensor %3889, %669 : 
!torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %3895 = torch.aten.view_as_real %3894 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_4657 = torch.constant.int 4 %int1_4658 = torch.constant.int 1 %int32_4659 = torch.constant.int 32 %int100_4660 = torch.constant.int 100 %3896 = torch.prim.ListConstruct %int4_4657, %int1_4658, %int32_4659, %int100_4660 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3897 = torch.aten.view %3895, %3896 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int1_4661 = torch.constant.int 1 %int1_4662 = torch.constant.int 1 %3898 = torch.aten.add.Scalar %arg2, %int1_4661, %int1_4662 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[4],si64> %int0_4663 = torch.constant.int 0 %int0_4664 = torch.constant.int 0 %3899 = torch.aten.select.int %3898, %int0_4663, %int0_4664 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_4665 = torch.constant.int 0 %int0_4666 = torch.constant.int 0 %3900 = torch.aten.select.int %arg3, %int0_4665, %int0_4666 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_4667 = torch.constant.int 0 %int0_4668 = torch.constant.int 0 %int9223372036854775807_4669 = torch.constant.int 9223372036854775807 %int1_4670 = torch.constant.int 1 %3901 = torch.aten.slice.Tensor %3900, %int0_4667, %int0_4668, %int9223372036854775807_4669, %int1_4670 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_4671 = torch.constant.int 16 %3902 = torch.aten.floor_divide.Scalar %3899, %int16_4671 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_4672 = torch.constant.int 0 %3903 = torch.aten.index_select %3901, %int0_4672, %3902 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_4673 = 
torch.constant.int 16 %3904 = torch.aten.remainder.Scalar %3899, %int16_4673 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_4674 = torch.constant.none %3905 = torch.aten.clone %430, %none_4674 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_4675 = torch.constant.none %3906 = torch.aten.clone %431, %none_4675 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_4676 = torch.constant.int 0 %3907 = torch.aten.unsqueeze %3904, %int0_4676 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_4677 = torch.constant.int 0 %int0_4678 = torch.constant.int 0 %3908 = torch.aten.select.int %3897, %int0_4677, %int0_4678 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_4679 = torch.constant.int 0 %int0_4680 = torch.constant.int 0 %3909 = torch.aten.select.int %3908, %int0_4679, %int0_4680 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %int-1_4681 = torch.constant.int -1 %int26_4682 = torch.constant.int 26 %int2_4683 = torch.constant.int 2 %int16_4684 = torch.constant.int 16 %int32_4685 = torch.constant.int 32 %int100_4686 = torch.constant.int 100 %3910 = torch.prim.ListConstruct %int-1_4681, %int26_4682, %int2_4683, %int16_4684, %int32_4685, %int100_4686 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3911 = torch.aten.view %3745, %3910 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %3912 = torch.prim.ListConstruct %3903, %3905, %3906, %3907 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_4687 = torch.constant.bool false %3913 = torch.aten.index_put %3911, %3912, %3909, %false_4687 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_4688 = 
torch.constant.int 2662400 %3914 = torch.prim.ListConstruct %731, %int2662400_4688 : (!torch.int, !torch.int) -> !torch.list %3915 = torch.aten.view %3913, %3914 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_4689 = torch.constant.int -1 %int26_4690 = torch.constant.int 26 %int2_4691 = torch.constant.int 2 %int16_4692 = torch.constant.int 16 %int32_4693 = torch.constant.int 32 %int100_4694 = torch.constant.int 100 %3916 = torch.prim.ListConstruct %int-1_4689, %int26_4690, %int2_4691, %int16_4692, %int32_4693, %int100_4694 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3917 = torch.aten.view %3915, %3916 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_4695 = torch.constant.none %3918 = torch.aten.clone %432, %none_4695 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_4696 = torch.constant.none %3919 = torch.aten.clone %433, %none_4696 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_4697 = torch.constant.int 0 %3920 = torch.aten.unsqueeze %3904, %int0_4697 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_4698 = torch.constant.int 0 %int0_4699 = torch.constant.int 0 %3921 = torch.aten.select.int %3883, %int0_4698, %int0_4699 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_4700 = torch.constant.int 0 %int0_4701 = torch.constant.int 0 %3922 = torch.aten.select.int %3921, %int0_4700, %int0_4701 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %3923 = torch.prim.ListConstruct %3903, %3918, %3919, %3920 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_4702 = torch.constant.bool false %3924 = torch.aten.index_put %3917, %3923, %3922, %false_4702 : !torch.vtensor<[?,26,2,16,32,100],f32>, 
!torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_4703 = torch.constant.int 2662400 %3925 = torch.prim.ListConstruct %731, %int2662400_4703 : (!torch.int, !torch.int) -> !torch.list %3926 = torch.aten.view %3924, %3925 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_4704 = torch.constant.int -1 %int26_4705 = torch.constant.int 26 %int2_4706 = torch.constant.int 2 %int16_4707 = torch.constant.int 16 %int32_4708 = torch.constant.int 32 %int100_4709 = torch.constant.int 100 %3927 = torch.prim.ListConstruct %int-1_4704, %int26_4705, %int2_4706, %int16_4707, %int32_4708, %int100_4709 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3928 = torch.aten.view %3926, %3927 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_4710 = torch.constant.int 0 %int1_4711 = torch.constant.int 1 %3929 = torch.aten.select.int %3898, %int0_4710, %int1_4711 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_4712 = torch.constant.int 0 %int1_4713 = torch.constant.int 1 %3930 = torch.aten.select.int %arg3, %int0_4712, %int1_4713 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_4714 = torch.constant.int 0 %int0_4715 = torch.constant.int 0 %int9223372036854775807_4716 = torch.constant.int 9223372036854775807 %int1_4717 = torch.constant.int 1 %3931 = torch.aten.slice.Tensor %3930, %int0_4714, %int0_4715, %int9223372036854775807_4716, %int1_4717 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_4718 = torch.constant.int 16 %3932 = torch.aten.floor_divide.Scalar %3929, %int16_4718 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_4719 = torch.constant.int 0 %3933 = torch.aten.index_select %3931, %int0_4719, %3932 : !torch.vtensor<[?],si64>, !torch.int, 
!torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_4720 = torch.constant.int 16 %3934 = torch.aten.remainder.Scalar %3929, %int16_4720 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_4721 = torch.constant.none %3935 = torch.aten.clone %434, %none_4721 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_4722 = torch.constant.none %3936 = torch.aten.clone %435, %none_4722 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_4723 = torch.constant.int 0 %3937 = torch.aten.unsqueeze %3934, %int0_4723 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_4724 = torch.constant.int 0 %int1_4725 = torch.constant.int 1 %3938 = torch.aten.select.int %3897, %int0_4724, %int1_4725 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_4726 = torch.constant.int 0 %int0_4727 = torch.constant.int 0 %3939 = torch.aten.select.int %3938, %int0_4726, %int0_4727 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %3940 = torch.prim.ListConstruct %3933, %3935, %3936, %3937 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_4728 = torch.constant.bool false %3941 = torch.aten.index_put %3928, %3940, %3939, %false_4728 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_4729 = torch.constant.int 2662400 %3942 = torch.prim.ListConstruct %731, %int2662400_4729 : (!torch.int, !torch.int) -> !torch.list %3943 = torch.aten.view %3941, %3942 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_4730 = torch.constant.int -1 %int26_4731 = torch.constant.int 26 %int2_4732 = torch.constant.int 2 %int16_4733 = torch.constant.int 16 %int32_4734 = torch.constant.int 32 %int100_4735 = torch.constant.int 100 %3944 = 
torch.prim.ListConstruct %int-1_4730, %int26_4731, %int2_4732, %int16_4733, %int32_4734, %int100_4735 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3945 = torch.aten.view %3943, %3944 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_4736 = torch.constant.none %3946 = torch.aten.clone %436, %none_4736 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_4737 = torch.constant.none %3947 = torch.aten.clone %437, %none_4737 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_4738 = torch.constant.int 0 %3948 = torch.aten.unsqueeze %3934, %int0_4738 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_4739 = torch.constant.int 0 %int1_4740 = torch.constant.int 1 %3949 = torch.aten.select.int %3883, %int0_4739, %int1_4740 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_4741 = torch.constant.int 0 %int0_4742 = torch.constant.int 0 %3950 = torch.aten.select.int %3949, %int0_4741, %int0_4742 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %3951 = torch.prim.ListConstruct %3933, %3946, %3947, %3948 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_4743 = torch.constant.bool false %3952 = torch.aten.index_put %3945, %3951, %3950, %false_4743 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_4744 = torch.constant.int 2662400 %3953 = torch.prim.ListConstruct %731, %int2662400_4744 : (!torch.int, !torch.int) -> !torch.list %3954 = torch.aten.view %3952, %3953 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_4745 = torch.constant.int -1 %int26_4746 = torch.constant.int 26 %int2_4747 = torch.constant.int 2 
%int16_4748 = torch.constant.int 16 %int32_4749 = torch.constant.int 32 %int100_4750 = torch.constant.int 100 %3955 = torch.prim.ListConstruct %int-1_4745, %int26_4746, %int2_4747, %int16_4748, %int32_4749, %int100_4750 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3956 = torch.aten.view %3954, %3955 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_4751 = torch.constant.int 0 %int2_4752 = torch.constant.int 2 %3957 = torch.aten.select.int %3898, %int0_4751, %int2_4752 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_4753 = torch.constant.int 0 %int2_4754 = torch.constant.int 2 %3958 = torch.aten.select.int %arg3, %int0_4753, %int2_4754 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_4755 = torch.constant.int 0 %int0_4756 = torch.constant.int 0 %int9223372036854775807_4757 = torch.constant.int 9223372036854775807 %int1_4758 = torch.constant.int 1 %3959 = torch.aten.slice.Tensor %3958, %int0_4755, %int0_4756, %int9223372036854775807_4757, %int1_4758 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_4759 = torch.constant.int 16 %3960 = torch.aten.floor_divide.Scalar %3957, %int16_4759 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_4760 = torch.constant.int 0 %3961 = torch.aten.index_select %3959, %int0_4760, %3960 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_4761 = torch.constant.int 16 %3962 = torch.aten.remainder.Scalar %3957, %int16_4761 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_4762 = torch.constant.none %3963 = torch.aten.clone %438, %none_4762 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_4763 = torch.constant.none %3964 = torch.aten.clone %439, %none_4763 : !torch.vtensor<[1],si64>, !torch.none -> 
!torch.vtensor<[1],si64> %int0_4764 = torch.constant.int 0 %3965 = torch.aten.unsqueeze %3962, %int0_4764 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_4765 = torch.constant.int 0 %int2_4766 = torch.constant.int 2 %3966 = torch.aten.select.int %3897, %int0_4765, %int2_4766 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_4767 = torch.constant.int 0 %int0_4768 = torch.constant.int 0 %3967 = torch.aten.select.int %3966, %int0_4767, %int0_4768 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %3968 = torch.prim.ListConstruct %3961, %3963, %3964, %3965 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_4769 = torch.constant.bool false %3969 = torch.aten.index_put %3956, %3968, %3967, %false_4769 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_4770 = torch.constant.int 2662400 %3970 = torch.prim.ListConstruct %731, %int2662400_4770 : (!torch.int, !torch.int) -> !torch.list %3971 = torch.aten.view %3969, %3970 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_4771 = torch.constant.int -1 %int26_4772 = torch.constant.int 26 %int2_4773 = torch.constant.int 2 %int16_4774 = torch.constant.int 16 %int32_4775 = torch.constant.int 32 %int100_4776 = torch.constant.int 100 %3972 = torch.prim.ListConstruct %int-1_4771, %int26_4772, %int2_4773, %int16_4774, %int32_4775, %int100_4776 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3973 = torch.aten.view %3971, %3972 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_4777 = torch.constant.none %3974 = torch.aten.clone %440, %none_4777 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> 
%none_4778 = torch.constant.none %3975 = torch.aten.clone %441, %none_4778 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_4779 = torch.constant.int 0 %3976 = torch.aten.unsqueeze %3962, %int0_4779 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_4780 = torch.constant.int 0 %int2_4781 = torch.constant.int 2 %3977 = torch.aten.select.int %3883, %int0_4780, %int2_4781 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_4782 = torch.constant.int 0 %int0_4783 = torch.constant.int 0 %3978 = torch.aten.select.int %3977, %int0_4782, %int0_4783 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %3979 = torch.prim.ListConstruct %3961, %3974, %3975, %3976 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_4784 = torch.constant.bool false %3980 = torch.aten.index_put %3973, %3979, %3978, %false_4784 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_4785 = torch.constant.int 2662400 %3981 = torch.prim.ListConstruct %731, %int2662400_4785 : (!torch.int, !torch.int) -> !torch.list %3982 = torch.aten.view %3980, %3981 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_4786 = torch.constant.int -1 %int26_4787 = torch.constant.int 26 %int2_4788 = torch.constant.int 2 %int16_4789 = torch.constant.int 16 %int32_4790 = torch.constant.int 32 %int100_4791 = torch.constant.int 100 %3983 = torch.prim.ListConstruct %int-1_4786, %int26_4787, %int2_4788, %int16_4789, %int32_4790, %int100_4791 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %3984 = torch.aten.view %3982, %3983 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_4792 = torch.constant.int 0 
%int3_4793 = torch.constant.int 3 %3985 = torch.aten.select.int %3898, %int0_4792, %int3_4793 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_4794 = torch.constant.int 0 %int3_4795 = torch.constant.int 3 %3986 = torch.aten.select.int %arg3, %int0_4794, %int3_4795 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_4796 = torch.constant.int 0 %int0_4797 = torch.constant.int 0 %int9223372036854775807_4798 = torch.constant.int 9223372036854775807 %int1_4799 = torch.constant.int 1 %3987 = torch.aten.slice.Tensor %3986, %int0_4796, %int0_4797, %int9223372036854775807_4798, %int1_4799 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_4800 = torch.constant.int 16 %3988 = torch.aten.floor_divide.Scalar %3985, %int16_4800 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_4801 = torch.constant.int 0 %3989 = torch.aten.index_select %3987, %int0_4801, %3988 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_4802 = torch.constant.int 16 %3990 = torch.aten.remainder.Scalar %3985, %int16_4802 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_4803 = torch.constant.none %3991 = torch.aten.clone %442, %none_4803 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_4804 = torch.constant.none %3992 = torch.aten.clone %443, %none_4804 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_4805 = torch.constant.int 0 %3993 = torch.aten.unsqueeze %3990, %int0_4805 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_4806 = torch.constant.int 0 %int3_4807 = torch.constant.int 3 %3994 = torch.aten.select.int %3897, %int0_4806, %int3_4807 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_4808 = torch.constant.int 0 %int0_4809 = torch.constant.int 0 %3995 = 
torch.aten.select.int %3994, %int0_4808, %int0_4809 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %3996 = torch.prim.ListConstruct %3989, %3991, %3992, %3993 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_4810 = torch.constant.bool false %3997 = torch.aten.index_put %3984, %3996, %3995, %false_4810 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_4811 = torch.constant.int 2662400 %3998 = torch.prim.ListConstruct %731, %int2662400_4811 : (!torch.int, !torch.int) -> !torch.list %3999 = torch.aten.view %3997, %3998 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_4812 = torch.constant.int -1 %int26_4813 = torch.constant.int 26 %int2_4814 = torch.constant.int 2 %int16_4815 = torch.constant.int 16 %int32_4816 = torch.constant.int 32 %int100_4817 = torch.constant.int 100 %4000 = torch.prim.ListConstruct %int-1_4812, %int26_4813, %int2_4814, %int16_4815, %int32_4816, %int100_4817 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4001 = torch.aten.view %3999, %4000 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_4818 = torch.constant.none %4002 = torch.aten.clone %444, %none_4818 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_4819 = torch.constant.none %4003 = torch.aten.clone %445, %none_4819 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_4820 = torch.constant.int 0 %4004 = torch.aten.unsqueeze %3990, %int0_4820 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_4821 = torch.constant.int 0 %int3_4822 = torch.constant.int 3 %4005 = torch.aten.select.int %3883, %int0_4821, %int3_4822 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int 
// ---- Cache write-back tail, then gather of two cache partitions ----------------
// NOTE(review): `!torch.list`, `!torch.list>` (and elsewhere bare `tensor` / `complex`)
// appear without type parameters; it looks like angle-bracket arguments were stripped
// from this text -- confirm against the original export before parsing.
// The next line opens with the result type of an op that begins before this excerpt.
// It then: takes element 0 along dim 0 of %4005 (%4006); index_puts it into the 6-D
// view %4001 at indices (%3989, %4002, %4003, %4004) with accumulate=false (%4008);
// flattens to [?,2662400] (%4010; 2662400 = 26*2*16*32*100).
// Gather indices: %4012 = %arg3 * 52 + 24, viewed as 1-D of length 4 * %655 (%4015).
// 52 = 26*2 (dims 1 and 2 of the 6-D view); presumably 24 selects sub-block 12,
// partition 0 of each row -- TODO confirm against the exporter.
-> !torch.vtensor<[1,32,100],f32> %int0_4823 = torch.constant.int 0 %int0_4824 = torch.constant.int 0 %4006 = torch.aten.select.int %4005, %int0_4823, %int0_4824 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %4007 = torch.prim.ListConstruct %3989, %4002, %4003, %4004 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_4825 = torch.constant.bool false %4008 = torch.aten.index_put %4001, %4007, %4006, %false_4825 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_4826 = torch.constant.int 2662400 %4009 = torch.prim.ListConstruct %731, %int2662400_4826 : (!torch.int, !torch.int) -> !torch.list %4010 = torch.aten.view %4008, %4009 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int52_4827 = torch.constant.int 52 %4011 = torch.aten.mul.Scalar %arg3, %int52_4827 : !torch.vtensor<[4,?],si64>, !torch.int -> !torch.vtensor<[4,?],si64> %int24 = torch.constant.int 24 %int1_4828 = torch.constant.int 1 %4012 = torch.aten.add.Scalar %4011, %int24, %int1_4828 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_4829 = torch.constant.int 4 %4013 = torch.aten.mul.int %int4_4829, %655 : !torch.int, !torch.int -> !torch.int %4014 = torch.prim.ListConstruct %4013 : (!torch.int) -> !torch.list %4015 = torch.aten.view %4012, %4014 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int-1_4830 = torch.constant.int -1 %int26_4831 = torch.constant.int 26 %int2_4832 = torch.constant.int 2 %int16_4833 = torch.constant.int 16 %int32_4834 = torch.constant.int 32 %int100_4835 = torch.constant.int 100 %4016 = torch.prim.ListConstruct %int-1_4830, %int26_4831, %int2_4832, %int16_4833, %int32_4834, %int100_4835 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) 
// %4017 re-views %4010 as [?,26,2,16,32,100]; %4021 collapses it to
// [%731*26*2, 16, 32, 100]. %4022 index_selects rows %4015 along dim 0; the result is
// reshaped to [4, %655, 16, 32, 100] (%4024) and then to [4, size(dim 1)*16, 32, 100]
// (%4028).
-> !torch.list %4017 = torch.aten.view %4010, %4016 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int26_4836 = torch.constant.int 26 %4018 = torch.aten.mul.int %731, %int26_4836 : !torch.int, !torch.int -> !torch.int %int2_4837 = torch.constant.int 2 %4019 = torch.aten.mul.int %4018, %int2_4837 : !torch.int, !torch.int -> !torch.int %int16_4838 = torch.constant.int 16 %int32_4839 = torch.constant.int 32 %int100_4840 = torch.constant.int 100 %4020 = torch.prim.ListConstruct %4019, %int16_4838, %int32_4839, %int100_4840 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4021 = torch.aten.view %4017, %4020 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,16,32,100],f32> %int0_4841 = torch.constant.int 0 %4022 = torch.aten.index_select %4021, %int0_4841, %4015 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_4842 = torch.constant.int 4 %int16_4843 = torch.constant.int 16 %int32_4844 = torch.constant.int 32 %int100_4845 = torch.constant.int 100 %4023 = torch.prim.ListConstruct %int4_4842, %655, %int16_4843, %int32_4844, %int100_4845 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4024 = torch.aten.view %4022, %4023 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_4846 = torch.constant.int 1 %4025 = torch.aten.size.int %4024, %int1_4846 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_4847 = torch.constant.int 16 %4026 = torch.aten.mul.int %4025, %int16_4847 : !torch.int, !torch.int -> !torch.int %int4_4848 = torch.constant.int 4 %int32_4849 = torch.constant.int 32 %int100_4850 = torch.constant.int 100 %4027 = torch.prim.ListConstruct %int4_4848, %4026, %int32_4849, %int100_4850 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4028 = torch.aten.view %4024, %4027 : !torch.vtensor<[4,?,16,32,100],f32>, 
// %4030 = %655 * 16 is the end bound used for every dim-1 slice below.
// %4031 = %3770[:, 0:%4030]; %4032 copies the gathered %4028 into that slice;
// %4034 scatters it back along dim 1. (The dim-0 slices use the full range 0..INT64_MAX.)
!torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_4851 = torch.constant.int 0 %int0_4852 = torch.constant.int 0 %int9223372036854775807_4853 = torch.constant.int 9223372036854775807 %int1_4854 = torch.constant.int 1 %4029 = torch.aten.slice.Tensor %3770, %int0_4851, %int0_4852, %int9223372036854775807_4853, %int1_4854 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int16_4855 = torch.constant.int 16 %4030 = torch.aten.mul.int %655, %int16_4855 : !torch.int, !torch.int -> !torch.int %int1_4856 = torch.constant.int 1 %int0_4857 = torch.constant.int 0 %int1_4858 = torch.constant.int 1 %4031 = torch.aten.slice.Tensor %4029, %int1_4856, %int0_4857, %4030, %int1_4858 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_4859 = torch.constant.bool false %4032 = torch.aten.copy %4031, %4028, %false_4859 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_4860 = torch.constant.int 0 %int0_4861 = torch.constant.int 0 %int9223372036854775807_4862 = torch.constant.int 9223372036854775807 %int1_4863 = torch.constant.int 1 %4033 = torch.aten.slice.Tensor %3770, %int0_4860, %int0_4861, %int9223372036854775807_4862, %int1_4863 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_4864 = torch.constant.int 1 %int0_4865 = torch.constant.int 0 %int1_4866 = torch.constant.int 1 %4034 = torch.aten.slice_scatter %4033, %4032, %int1_4864, %int0_4865, %4030, %int1_4866 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_4867 = torch.constant.int 0 %int0_4868 = torch.constant.int 0 %int9223372036854775807_4869 = torch.constant.int 9223372036854775807 %int1_4870 = 
// %4035 = %3770 with %4034 scattered over the full dim-0 range (first gathered buffer).
// Second gather: indices %4036 = %4012 + 1 (i.e. %arg3 * 52 + 25), flattened to %4039,
// index_select on the same %4021, reshaped the same way to %4046.
torch.constant.int 1 %4035 = torch.aten.slice_scatter %3770, %4034, %int0_4867, %int0_4868, %int9223372036854775807_4869, %int1_4870 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_4871 = torch.constant.int 1 %int1_4872 = torch.constant.int 1 %4036 = torch.aten.add.Scalar %4012, %int1_4871, %int1_4872 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_4873 = torch.constant.int 4 %4037 = torch.aten.mul.int %int4_4873, %655 : !torch.int, !torch.int -> !torch.int %4038 = torch.prim.ListConstruct %4037 : (!torch.int) -> !torch.list %4039 = torch.aten.view %4036, %4038 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int0_4874 = torch.constant.int 0 %4040 = torch.aten.index_select %4021, %int0_4874, %4039 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_4875 = torch.constant.int 4 %int16_4876 = torch.constant.int 16 %int32_4877 = torch.constant.int 32 %int100_4878 = torch.constant.int 100 %4041 = torch.prim.ListConstruct %int4_4875, %655, %int16_4876, %int32_4877, %int100_4878 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4042 = torch.aten.view %4040, %4041 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_4879 = torch.constant.int 1 %4043 = torch.aten.size.int %4042, %int1_4879 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_4880 = torch.constant.int 16 %4044 = torch.aten.mul.int %4043, %int16_4880 : !torch.int, !torch.int -> !torch.int %int4_4881 = torch.constant.int 4 %int32_4882 = torch.constant.int 32 %int100_4883 = torch.constant.int 100 %4045 = torch.prim.ListConstruct %int4_4881, %4044, %int32_4882, %int100_4883 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4046 = torch.aten.view %4042, %4045 : 
// Same slice / copy / slice_scatter sequence as above, this time targeting %3787 and
// using the second gather %4046; the final slice_scatter (%4052) is completed on the
// line after this block.
!torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_4884 = torch.constant.int 0 %int0_4885 = torch.constant.int 0 %int9223372036854775807_4886 = torch.constant.int 9223372036854775807 %int1_4887 = torch.constant.int 1 %4047 = torch.aten.slice.Tensor %3787, %int0_4884, %int0_4885, %int9223372036854775807_4886, %int1_4887 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_4888 = torch.constant.int 1 %int0_4889 = torch.constant.int 0 %int1_4890 = torch.constant.int 1 %4048 = torch.aten.slice.Tensor %4047, %int1_4888, %int0_4889, %4030, %int1_4890 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_4891 = torch.constant.bool false %4049 = torch.aten.copy %4048, %4046, %false_4891 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_4892 = torch.constant.int 0 %int0_4893 = torch.constant.int 0 %int9223372036854775807_4894 = torch.constant.int 9223372036854775807 %int1_4895 = torch.constant.int 1 %4050 = torch.aten.slice.Tensor %3787, %int0_4892, %int0_4893, %int9223372036854775807_4894, %int1_4895 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_4896 = torch.constant.int 1 %int0_4897 = torch.constant.int 0 %int1_4898 = torch.constant.int 1 %4051 = torch.aten.slice_scatter %4050, %4049, %int1_4896, %int0_4897, %4030, %int1_4898 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_4899 = torch.constant.int 0 %int0_4900 = torch.constant.int 0 %int9223372036854775807_4901 = torch.constant.int 9223372036854775807 %int1_4902 = torch.constant.int 1 %4052 = torch.aten.slice_scatter %3787, %4051, %int0_4899, %int0_4900, 
// ---- Two batched matmuls with a softmax in between -----------------------------
// NOTE(review): `!torch.list` appears without an element type throughout; it looks
// like angle-bracket type arguments were stripped from this text -- confirm against
// the original export.
// The next line opens with the trailing operands/types of a slice_scatter (%4052)
// that begins on the previous line.
// %4054 / %4056 are %671 / %673 sliced to [0, %4030) along dim 1; within this excerpt
// they are only read through size.int (%4066, %4085).
// %4057 swaps dims 1 and 2 of %3893: [4,1,32,100] -> [4,32,1,100].
// Presumably %3893 is the query and %4035 / %4052 the key / value buffers of a scaled
// dot-product attention -- TODO confirm with the exporting model code.
%int9223372036854775807_4901, %int1_4902 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_4903 = torch.constant.int 0 %int0_4904 = torch.constant.int 0 %int9223372036854775807_4905 = torch.constant.int 9223372036854775807 %int1_4906 = torch.constant.int 1 %4053 = torch.aten.slice.Tensor %671, %int0_4903, %int0_4904, %int9223372036854775807_4905, %int1_4906 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_4907 = torch.constant.int 1 %int0_4908 = torch.constant.int 0 %int1_4909 = torch.constant.int 1 %4054 = torch.aten.slice.Tensor %4053, %int1_4907, %int0_4908, %4030, %int1_4909 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int0_4910 = torch.constant.int 0 %int0_4911 = torch.constant.int 0 %int9223372036854775807_4912 = torch.constant.int 9223372036854775807 %int1_4913 = torch.constant.int 1 %4055 = torch.aten.slice.Tensor %673, %int0_4910, %int0_4911, %int9223372036854775807_4912, %int1_4913 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_4914 = torch.constant.int 1 %int0_4915 = torch.constant.int 0 %int1_4916 = torch.constant.int 1 %4056 = torch.aten.slice.Tensor %4055, %int1_4914, %int0_4915, %4030, %int1_4916 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_4917 = torch.constant.int 1 %int2_4918 = torch.constant.int 2 %4057 = torch.aten.transpose.int %3893, %int1_4917, %int2_4918 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,1,100],f32> %int4_4919 = torch.constant.int 4 %int32_4920 = torch.constant.int 32 %int1_4921 = torch.constant.int 1 %int100_4922 = torch.constant.int 100 %4058 = 
// Left operand: %4057 expanded (same shape) and flattened to [128,1,100] (%4061).
// Right operand: %4035 sliced to [0, %4030) along dim 1, then transposed twice to
// [4,32,100,?] (%4065). %4066 = size of %4054 along dim 1.
torch.prim.ListConstruct %int4_4919, %int32_4920, %int1_4921, %int100_4922 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_4923 = torch.constant.bool false %4059 = torch.aten.expand %4057, %4058, %false_4923 : !torch.vtensor<[4,32,1,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,100],f32> %int128_4924 = torch.constant.int 128 %int1_4925 = torch.constant.int 1 %int100_4926 = torch.constant.int 100 %4060 = torch.prim.ListConstruct %int128_4924, %int1_4925, %int100_4926 : (!torch.int, !torch.int, !torch.int) -> !torch.list %4061 = torch.aten.view %4059, %4060 : !torch.vtensor<[4,32,1,100],f32>, !torch.list -> !torch.vtensor<[128,1,100],f32> %int0_4927 = torch.constant.int 0 %int0_4928 = torch.constant.int 0 %int9223372036854775807_4929 = torch.constant.int 9223372036854775807 %int1_4930 = torch.constant.int 1 %4062 = torch.aten.slice.Tensor %4035, %int0_4927, %int0_4928, %int9223372036854775807_4929, %int1_4930 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_4931 = torch.constant.int 1 %int0_4932 = torch.constant.int 0 %int1_4933 = torch.constant.int 1 %4063 = torch.aten.slice.Tensor %4062, %int1_4931, %int0_4932, %4030, %int1_4933 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_4934 = torch.constant.int 1 %int2_4935 = torch.constant.int 2 %4064 = torch.aten.transpose.int %4063, %int1_4934, %int2_4935 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int2_4936 = torch.constant.int 2 %int3_4937 = torch.constant.int 3 %4065 = torch.aten.transpose.int %4064, %int2_4936, %int3_4937 : !torch.vtensor<[4,32,?,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int1_4938 = torch.constant.int 1 %4066 = torch.aten.size.int %4054, %int1_4938 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_4939 = 
// %4065 is expanded, cloned and viewed as [128,100,%4066] (%4071).
// %4072 = bmm(%4061, %4071) -> [128,1,?], viewed as [4,32,1,?] (%4074).
// %4075 = %4074 / 10.0 (10 = sqrt(100); presumably the 1/sqrt(head_dim) scale).
// %4076 = %4075 + %895, where %895 is [4,1,1,?] and broadcasts over dim 1
// (presumably the attention mask -- confirm). %4077 = softmax over the last dim.
torch.constant.int 4 %int32_4940 = torch.constant.int 32 %int100_4941 = torch.constant.int 100 %4067 = torch.prim.ListConstruct %int4_4939, %int32_4940, %int100_4941, %4066 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_4942 = torch.constant.bool false %4068 = torch.aten.expand %4065, %4067, %false_4942 : !torch.vtensor<[4,32,100,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,100,?],f32> %int0_4943 = torch.constant.int 0 %4069 = torch.aten.clone %4068, %int0_4943 : !torch.vtensor<[4,32,100,?],f32>, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int128_4944 = torch.constant.int 128 %int100_4945 = torch.constant.int 100 %4070 = torch.prim.ListConstruct %int128_4944, %int100_4945, %4066 : (!torch.int, !torch.int, !torch.int) -> !torch.list %4071 = torch.aten._unsafe_view %4069, %4070 : !torch.vtensor<[4,32,100,?],f32>, !torch.list -> !torch.vtensor<[128,100,?],f32> %4072 = torch.aten.bmm %4061, %4071 : !torch.vtensor<[128,1,100],f32>, !torch.vtensor<[128,100,?],f32> -> !torch.vtensor<[128,1,?],f32> %int4_4946 = torch.constant.int 4 %int32_4947 = torch.constant.int 32 %int1_4948 = torch.constant.int 1 %4073 = torch.prim.ListConstruct %int4_4946, %int32_4947, %int1_4948, %4066 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4074 = torch.aten.view %4072, %4073 : !torch.vtensor<[128,1,?],f32>, !torch.list -> !torch.vtensor<[4,32,1,?],f32> %float1.000000e01_4949 = torch.constant.float 1.000000e+01 %4075 = torch.aten.div.Scalar %4074, %float1.000000e01_4949 : !torch.vtensor<[4,32,1,?],f32>, !torch.float -> !torch.vtensor<[4,32,1,?],f32> %int1_4950 = torch.constant.int 1 %4076 = torch.aten.add.Tensor %4075, %895, %int1_4950 : !torch.vtensor<[4,32,1,?],f32>, !torch.vtensor<[4,1,1,?],f32>, !torch.int -> !torch.vtensor<[4,32,1,?],f32> %int-1_4951 = torch.constant.int -1 %false_4952 = torch.constant.bool false %4077 = torch.aten._softmax %4076, %int-1_4951, %false_4952 : !torch.vtensor<[4,32,1,?],f32>, !torch.int, 
// Softmax output is expanded and flattened to [128,1,%4066] (%4081).
// Second right operand: %4052 sliced to [0, %4030) along dim 1 and transposed to
// [4,32,?,100] (%4084). %4085 = size of %4056 along dim 1.
!torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int4_4953 = torch.constant.int 4 %int32_4954 = torch.constant.int 32 %int1_4955 = torch.constant.int 1 %4078 = torch.prim.ListConstruct %int4_4953, %int32_4954, %int1_4955, %4066 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_4956 = torch.constant.bool false %4079 = torch.aten.expand %4077, %4078, %false_4956 : !torch.vtensor<[4,32,1,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int128_4957 = torch.constant.int 128 %int1_4958 = torch.constant.int 1 %4080 = torch.prim.ListConstruct %int128_4957, %int1_4958, %4066 : (!torch.int, !torch.int, !torch.int) -> !torch.list %4081 = torch.aten.view %4079, %4080 : !torch.vtensor<[4,32,1,?],f32>, !torch.list -> !torch.vtensor<[128,1,?],f32> %int0_4959 = torch.constant.int 0 %int0_4960 = torch.constant.int 0 %int9223372036854775807_4961 = torch.constant.int 9223372036854775807 %int1_4962 = torch.constant.int 1 %4082 = torch.aten.slice.Tensor %4052, %int0_4959, %int0_4960, %int9223372036854775807_4961, %int1_4962 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_4963 = torch.constant.int 1 %int0_4964 = torch.constant.int 0 %int1_4965 = torch.constant.int 1 %4083 = torch.aten.slice.Tensor %4082, %int1_4963, %int0_4964, %4030, %int1_4965 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_4966 = torch.constant.int 1 %int2_4967 = torch.constant.int 2 %4084 = torch.aten.transpose.int %4083, %int1_4966, %int2_4967 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int1_4968 = torch.constant.int 1 %4085 = torch.aten.size.int %4056, %int1_4968 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_4969 = torch.constant.int 4 %int32_4970 = torch.constant.int 32 %int100_4971 = torch.constant.int 100 %4086 = torch.prim.ListConstruct 
// %4084 is expanded, cloned and viewed as [128,%4085,100] (%4090).
// %4091 = bmm(%4081, %4090) -> [128,1,100]; viewed as [4,32,1,100], dims 1 and 2
// swapped back, and flattened to [4,1,3200] (%4096) before conversion to a builtin
// tensor (%4097, whose result type is on the line after this block).
%int4_4969, %int32_4970, %4085, %int100_4971 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_4972 = torch.constant.bool false %4087 = torch.aten.expand %4084, %4086, %false_4972 : !torch.vtensor<[4,32,?,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,?,100],f32> %int0_4973 = torch.constant.int 0 %4088 = torch.aten.clone %4087, %int0_4973 : !torch.vtensor<[4,32,?,100],f32>, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int128_4974 = torch.constant.int 128 %int100_4975 = torch.constant.int 100 %4089 = torch.prim.ListConstruct %int128_4974, %4085, %int100_4975 : (!torch.int, !torch.int, !torch.int) -> !torch.list %4090 = torch.aten._unsafe_view %4088, %4089 : !torch.vtensor<[4,32,?,100],f32>, !torch.list -> !torch.vtensor<[128,?,100],f32> %4091 = torch.aten.bmm %4081, %4090 : !torch.vtensor<[128,1,?],f32>, !torch.vtensor<[128,?,100],f32> -> !torch.vtensor<[128,1,100],f32> %int4_4976 = torch.constant.int 4 %int32_4977 = torch.constant.int 32 %int1_4978 = torch.constant.int 1 %int100_4979 = torch.constant.int 100 %4092 = torch.prim.ListConstruct %int4_4976, %int32_4977, %int1_4978, %int100_4979 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4093 = torch.aten.view %4091, %4092 : !torch.vtensor<[128,1,100],f32>, !torch.list -> !torch.vtensor<[4,32,1,100],f32> %int1_4980 = torch.constant.int 1 %int2_4981 = torch.constant.int 2 %4094 = torch.aten.transpose.int %4093, %int1_4980, %int2_4981 : !torch.vtensor<[4,32,1,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,1,32,100],f32> %int4_4982 = torch.constant.int 4 %int1_4983 = torch.constant.int 1 %int-1_4984 = torch.constant.int -1 %4095 = torch.prim.ListConstruct %int4_4982, %int1_4983, %int-1_4984 : (!torch.int, !torch.int, !torch.int) -> !torch.list %4096 = torch.aten.view %4094, %4095 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,3200],f32> %4097 = torch_c.to_builtin_tensor %4096 : !torch.vtensor<[4,1,3200],f32> -> 
// ---- Projection, add, normalization, gated three-matmul stage, add -------------
// NOTE(review): `tensor.cast ... to tensor` and the `util.call` signatures
// `(tensor, tensor<...>) -> tensor` carry no shape or element type, and `!torch.list`
// has no element type; it looks like angle-bracket type arguments were stripped from
// this text -- confirm against the original export before parsing.
// The next line opens with the result type of a to_builtin_tensor (%4097) that begins
// on the previous line.
// %4100 = @sharktank_mmtfp_3d_3200_3200_f32f16f32(%4097, %114), cast back to 4x1x3200.
// %4101 = %3858 + %4100 (alpha = 1).
// Normalization of %4101: square, mean over the last dim with keepdim=true, add
// 9.9999999747524271E-7, rsqrt, multiply back into %4101, then scale by %115 (%4108).
tensor<4x1x3200xf32> %cast_4985 = tensor.cast %4097 : tensor<4x1x3200xf32> to tensor %4098 = torch_c.to_builtin_tensor %114 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %4099 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_4985, %4098) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_4986 = tensor.cast %4099 : tensor to tensor<4x1x3200xf32> %4100 = torch_c.from_builtin_tensor %cast_4986 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int1_4987 = torch.constant.int 1 %4101 = torch.aten.add.Tensor %3858, %4100, %int1_4987 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_4988 = torch.constant.int 2 %4102 = torch.aten.pow.Tensor_Scalar %4101, %int2_4988 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_4989 = torch.constant.int -1 %4103 = torch.prim.ListConstruct %int-1_4989 : (!torch.int) -> !torch.list %true_4990 = torch.constant.bool true %none_4991 = torch.constant.none %4104 = torch.aten.mean.dim %4102, %4103, %true_4990, %none_4991 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_4992 = torch.constant.float 9.9999999747524271E-7 %int1_4993 = torch.constant.int 1 %4105 = torch.aten.add.Scalar %4104, %float9.999990e-07_4992, %int1_4993 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %4106 = torch.aten.rsqrt %4105 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %4107 = torch.aten.mul.Tensor %4101, %4106 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %4108 = torch.aten.mul.Tensor %4107, %115 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %4109 = torch_c.to_builtin_tensor %4108 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_4994 = tensor.cast %4109 : tensor<4x1x3200xf32> to tensor %4110 = 
// %4113 = silu(@sharktank_mmtfp_3d_8640_3200_f32f16f32(%4108, %116)).
// %4117 =       @sharktank_mmtfp_3d_8640_3200_f32f16f32(%4108, %117).
// %4118 = %4113 * %4117 (elementwise), then
// %4122 = @sharktank_mmtfp_3d_3200_8640_f32f16f32(%4118, %118).
// %4123 = %4101 + %4122 (alpha = 1). The trailing pow op continues on the next line.
// The weight shapes (8640x3200, 8640x3200, 3200x8640) match the ffn_gate / ffn_up /
// ffn_down globals declared at the top of the file; which block %116..%118 belong to
// is not visible here -- TODO confirm.
torch_c.to_builtin_tensor %116 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %4111 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_4994, %4110) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_4995 = tensor.cast %4111 : tensor to tensor<4x1x8640xf32> %4112 = torch_c.from_builtin_tensor %cast_4995 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %4113 = torch.aten.silu %4112 : !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32> %4114 = torch_c.to_builtin_tensor %4108 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_4996 = tensor.cast %4114 : tensor<4x1x3200xf32> to tensor %4115 = torch_c.to_builtin_tensor %117 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %4116 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_4996, %4115) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_4997 = tensor.cast %4116 : tensor to tensor<4x1x8640xf32> %4117 = torch_c.from_builtin_tensor %cast_4997 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %4118 = torch.aten.mul.Tensor %4113, %4117 : !torch.vtensor<[4,1,8640],f32>, !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32> %4119 = torch_c.to_builtin_tensor %4118 : !torch.vtensor<[4,1,8640],f32> -> tensor<4x1x8640xf32> %cast_4998 = tensor.cast %4119 : tensor<4x1x8640xf32> to tensor %4120 = torch_c.to_builtin_tensor %118 : !torch.vtensor<[3200,8640],f16> -> tensor<3200x8640xf16> %4121 = util.call @sharktank_mmtfp_3d_3200_8640_f32f16f32(%cast_4998, %4120) : (tensor, tensor<3200x8640xf16>) -> tensor %cast_4999 = tensor.cast %4121 : tensor to tensor<4x1x3200xf32> %4122 = torch_c.from_builtin_tensor %cast_4999 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int1_5000 = torch.constant.int 1 %4123 = torch.aten.add.Tensor %4101, %4122, %int1_5000 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_5001 = torch.constant.int 2 %4124 = torch.aten.pow.Tensor_Scalar %4123, 
// ---- Normalization, three 3200x3200 projections, complex multiply, index math ---
// NOTE(review): bare `tensor`, `!torch.list` and `complex` appear without type
// parameters; it looks like angle-bracket type arguments were stripped from this
// text -- confirm against the original export before parsing.
// The next line opens with the trailing operand/types of a pow op (%4124 = %4123 ^ 2)
// that begins on the previous line.
// Normalization of %4123: mean of squares over the last dim (keepdim=true), add
// 9.9999999747524271E-7, rsqrt, multiply back into %4123, then scale by %119 (%4130).
// %4134 = @sharktank_mmtfp_3d_3200_3200_f32f16f32(%4130, %120);
// %4137 = the same kernel applied to (%4130, %121); its cast back is on the next line.
%int2_5001 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_5002 = torch.constant.int -1 %4125 = torch.prim.ListConstruct %int-1_5002 : (!torch.int) -> !torch.list %true_5003 = torch.constant.bool true %none_5004 = torch.constant.none %4126 = torch.aten.mean.dim %4124, %4125, %true_5003, %none_5004 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_5005 = torch.constant.float 9.9999999747524271E-7 %int1_5006 = torch.constant.int 1 %4127 = torch.aten.add.Scalar %4126, %float9.999990e-07_5005, %int1_5006 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %4128 = torch.aten.rsqrt %4127 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %4129 = torch.aten.mul.Tensor %4123, %4128 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %4130 = torch.aten.mul.Tensor %4129, %119 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %4131 = torch_c.to_builtin_tensor %4130 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_5007 = tensor.cast %4131 : tensor<4x1x3200xf32> to tensor %4132 = torch_c.to_builtin_tensor %120 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %4133 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_5007, %4132) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_5008 = tensor.cast %4133 : tensor to tensor<4x1x3200xf32> %4134 = torch_c.from_builtin_tensor %cast_5008 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %4135 = torch_c.to_builtin_tensor %4130 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_5009 = tensor.cast %4135 : tensor<4x1x3200xf32> to tensor %4136 = torch_c.to_builtin_tensor %121 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %4137 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_5009, %4136) : (tensor, tensor<3200x3200xf16>) -> tensor 
// %4138 wraps the %121 projection; %4142 = the same kernel applied to (%4130, %122).
// All three projections are then viewed as [4,1,32,100]: %4144 (from %120),
// %4146 (from %121), %4148 (from %122).
// Presumably these are the Q / K / V projections of the next block -- TODO confirm.
%cast_5010 = tensor.cast %4137 : tensor to tensor<4x1x3200xf32> %4138 = torch_c.from_builtin_tensor %cast_5010 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %4139 = torch_c.to_builtin_tensor %4130 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_5011 = tensor.cast %4139 : tensor<4x1x3200xf32> to tensor %4140 = torch_c.to_builtin_tensor %122 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %4141 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_5011, %4140) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_5012 = tensor.cast %4141 : tensor to tensor<4x1x3200xf32> %4142 = torch_c.from_builtin_tensor %cast_5012 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int4_5013 = torch.constant.int 4 %int1_5014 = torch.constant.int 1 %int32_5015 = torch.constant.int 32 %int100_5016 = torch.constant.int 100 %4143 = torch.prim.ListConstruct %int4_5013, %int1_5014, %int32_5015, %int100_5016 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4144 = torch.aten.view %4134, %4143 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_5017 = torch.constant.int 4 %int1_5018 = torch.constant.int 1 %int32_5019 = torch.constant.int 32 %int100_5020 = torch.constant.int 100 %4145 = torch.prim.ListConstruct %int4_5017, %int1_5018, %int32_5019, %int100_5020 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4146 = torch.aten.view %4138, %4145 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_5021 = torch.constant.int 4 %int1_5022 = torch.constant.int 1 %int32_5023 = torch.constant.int 32 %int100_5024 = torch.constant.int 100 %4147 = torch.prim.ListConstruct %int4_5021, %int1_5022, %int32_5023, %int100_5024 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4148 = torch.aten.view %4142, %4147 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_5025 = torch.constant.int 4 %int1_5026 = 
// %4144 and %4146 are each viewed as [4,1,32,50,2] and reinterpreted as complex
// [4,1,32,50] (%4151, %4154). Each is multiplied by %669 (complex [4,1,1,50]) and
// converted back with view_as_real to [4,1,32,100] (%4158, and %4162 on the next line).
// %4148 is not multiplied by %669. Presumably this is the rotary position embedding
// applied to Q and K only -- TODO confirm.
torch.constant.int 1 %int32_5027 = torch.constant.int 32 %int-1_5028 = torch.constant.int -1 %int2_5029 = torch.constant.int 2 %4149 = torch.prim.ListConstruct %int4_5025, %int1_5026, %int32_5027, %int-1_5028, %int2_5029 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4150 = torch.aten.view %4144, %4149 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %4151 = torch.aten.view_as_complex %4150 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %int4_5030 = torch.constant.int 4 %int1_5031 = torch.constant.int 1 %int32_5032 = torch.constant.int 32 %int-1_5033 = torch.constant.int -1 %int2_5034 = torch.constant.int 2 %4152 = torch.prim.ListConstruct %int4_5030, %int1_5031, %int32_5032, %int-1_5033, %int2_5034 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4153 = torch.aten.view %4146, %4152 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %4154 = torch.aten.view_as_complex %4153 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %4155 = torch.aten.mul.Tensor %4151, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %4156 = torch.aten.view_as_real %4155 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_5035 = torch.constant.int 4 %int1_5036 = torch.constant.int 1 %int32_5037 = torch.constant.int 32 %int100_5038 = torch.constant.int 100 %4157 = torch.prim.ListConstruct %int4_5035, %int1_5036, %int32_5037, %int100_5038 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4158 = torch.aten.view %4156, %4157 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %4159 = torch.aten.mul.Tensor %4154, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %4160 = torch.aten.view_as_real %4159 : 
// Index arithmetic for batch entry 0:
//   %4163 = %arg2 + 1;  %4164 = %4163[0];  %4166 = %arg3[0] (full-range slice);
//   %4167 = floor(%4164 / 16);  %4168 = %4166[%4167];  %4169 = %4164 mod 16.
// Presumably %arg2 holds per-sequence positions and %arg3 a page table with 16
// positions per page -- TODO confirm against the function signature.
!torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_5039 = torch.constant.int 4 %int1_5040 = torch.constant.int 1 %int32_5041 = torch.constant.int 32 %int100_5042 = torch.constant.int 100 %4161 = torch.prim.ListConstruct %int4_5039, %int1_5040, %int32_5041, %int100_5042 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4162 = torch.aten.view %4160, %4161 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int1_5043 = torch.constant.int 1 %int1_5044 = torch.constant.int 1 %4163 = torch.aten.add.Scalar %arg2, %int1_5043, %int1_5044 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[4],si64> %int0_5045 = torch.constant.int 0 %int0_5046 = torch.constant.int 0 %4164 = torch.aten.select.int %4163, %int0_5045, %int0_5046 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_5047 = torch.constant.int 0 %int0_5048 = torch.constant.int 0 %4165 = torch.aten.select.int %arg3, %int0_5047, %int0_5048 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_5049 = torch.constant.int 0 %int0_5050 = torch.constant.int 0 %int9223372036854775807_5051 = torch.constant.int 9223372036854775807 %int1_5052 = torch.constant.int 1 %4166 = torch.aten.slice.Tensor %4165, %int0_5049, %int0_5050, %int9223372036854775807_5051, %int1_5052 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_5053 = torch.constant.int 16 %4167 = torch.aten.floor_divide.Scalar %4164, %int16_5053 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_5054 = torch.constant.int 0 %4168 = torch.aten.index_select %4166, %int0_5054, %4167 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_5055 = torch.constant.int 16 %4169 = torch.aten.remainder.Scalar %4164, %int16_5055 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_5056 = 
// ---- index_put writes into the 6-D cache view for batch entries 0 and 1 --------
// NOTE(review): `!torch.list` and `!torch.list>` appear without type parameters; it
// looks like angle-bracket type arguments were stripped from this text -- confirm
// against the original export before parsing.
// The next line opens with the op that defines %none_5056 (its `%none_5056 =` is on
// the previous line).
// First write, batch entry 0: %4174 = %4162[0][0] ([32,100]) is index_put into
// %4176 (= %4010 viewed as [?,26,2,16,32,100]) at (%4168, clone(%446), clone(%447),
// unsqueeze(%4169)) with accumulate=false (%4178); the flatten back to [?,2662400]
// finishes on the next line.
// %446 / %447 are [1] si64 tensors defined outside this excerpt; presumably they are
// the dim-1 and dim-2 indices of the target cache slot -- TODO confirm.
torch.constant.none %4170 = torch.aten.clone %446, %none_5056 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_5057 = torch.constant.none %4171 = torch.aten.clone %447, %none_5057 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_5058 = torch.constant.int 0 %4172 = torch.aten.unsqueeze %4169, %int0_5058 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_5059 = torch.constant.int 0 %int0_5060 = torch.constant.int 0 %4173 = torch.aten.select.int %4162, %int0_5059, %int0_5060 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_5061 = torch.constant.int 0 %int0_5062 = torch.constant.int 0 %4174 = torch.aten.select.int %4173, %int0_5061, %int0_5062 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %int-1_5063 = torch.constant.int -1 %int26_5064 = torch.constant.int 26 %int2_5065 = torch.constant.int 2 %int16_5066 = torch.constant.int 16 %int32_5067 = torch.constant.int 32 %int100_5068 = torch.constant.int 100 %4175 = torch.prim.ListConstruct %int-1_5063, %int26_5064, %int2_5065, %int16_5066, %int32_5067, %int100_5068 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4176 = torch.aten.view %4010, %4175 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %4177 = torch.prim.ListConstruct %4168, %4170, %4171, %4172 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_5069 = torch.constant.bool false %4178 = torch.aten.index_put %4176, %4177, %4174, %false_5069 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_5070 = torch.constant.int 2662400 %4179 = torch.prim.ListConstruct %731, %int2662400_5070 : (!torch.int, !torch.int) -> !torch.list %4180 = torch.aten.view %4178, 
// %4180 is the flattened result of the first write; %4182 re-views it as 6-D.
// Second write, batch entry 0: %4187 = %4148[0][0] is index_put into %4182 at
// (%4168, clone(%448), clone(%449), unsqueeze(%4169)) -> %4189.
%4179 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_5071 = torch.constant.int -1 %int26_5072 = torch.constant.int 26 %int2_5073 = torch.constant.int 2 %int16_5074 = torch.constant.int 16 %int32_5075 = torch.constant.int 32 %int100_5076 = torch.constant.int 100 %4181 = torch.prim.ListConstruct %int-1_5071, %int26_5072, %int2_5073, %int16_5074, %int32_5075, %int100_5076 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4182 = torch.aten.view %4180, %4181 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_5077 = torch.constant.none %4183 = torch.aten.clone %448, %none_5077 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_5078 = torch.constant.none %4184 = torch.aten.clone %449, %none_5078 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_5079 = torch.constant.int 0 %4185 = torch.aten.unsqueeze %4169, %int0_5079 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_5080 = torch.constant.int 0 %int0_5081 = torch.constant.int 0 %4186 = torch.aten.select.int %4148, %int0_5080, %int0_5081 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_5082 = torch.constant.int 0 %int0_5083 = torch.constant.int 0 %4187 = torch.aten.select.int %4186, %int0_5082, %int0_5083 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %4188 = torch.prim.ListConstruct %4168, %4183, %4184, %4185 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_5084 = torch.constant.bool false %4189 = torch.aten.index_put %4182, %4188, %4187, %false_5084 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_5085 = torch.constant.int 2662400 %4190 = 
// %4189 is flattened (%4191) and re-viewed as 6-D (%4193).
// Index arithmetic for batch entry 1, same form as for entry 0:
//   %4194 = %4163[1];  %4196 = %arg3[1];  %4198 = %4196[floor(%4194 / 16)];
//   %4199 = %4194 mod 16 (its type signature continues on the next line).
torch.prim.ListConstruct %731, %int2662400_5085 : (!torch.int, !torch.int) -> !torch.list %4191 = torch.aten.view %4189, %4190 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_5086 = torch.constant.int -1 %int26_5087 = torch.constant.int 26 %int2_5088 = torch.constant.int 2 %int16_5089 = torch.constant.int 16 %int32_5090 = torch.constant.int 32 %int100_5091 = torch.constant.int 100 %4192 = torch.prim.ListConstruct %int-1_5086, %int26_5087, %int2_5088, %int16_5089, %int32_5090, %int100_5091 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4193 = torch.aten.view %4191, %4192 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_5092 = torch.constant.int 0 %int1_5093 = torch.constant.int 1 %4194 = torch.aten.select.int %4163, %int0_5092, %int1_5093 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_5094 = torch.constant.int 0 %int1_5095 = torch.constant.int 1 %4195 = torch.aten.select.int %arg3, %int0_5094, %int1_5095 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_5096 = torch.constant.int 0 %int0_5097 = torch.constant.int 0 %int9223372036854775807_5098 = torch.constant.int 9223372036854775807 %int1_5099 = torch.constant.int 1 %4196 = torch.aten.slice.Tensor %4195, %int0_5096, %int0_5097, %int9223372036854775807_5098, %int1_5099 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_5100 = torch.constant.int 16 %4197 = torch.aten.floor_divide.Scalar %4194, %int16_5100 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_5101 = torch.constant.int 0 %4198 = torch.aten.index_select %4196, %int0_5101, %4197 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_5102 = torch.constant.int 16 %4199 = torch.aten.remainder.Scalar %4194, %int16_5102 : 
// First write, batch entry 1: %4204 = %4162[1][0] is index_put into %4193 at
// (%4198, clone(%450), clone(%451), unsqueeze(%4199)) -> %4206, flattened to %4208.
// The final ListConstruct (%4209) is cut off by the end of this excerpt.
!torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_5103 = torch.constant.none %4200 = torch.aten.clone %450, %none_5103 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_5104 = torch.constant.none %4201 = torch.aten.clone %451, %none_5104 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_5105 = torch.constant.int 0 %4202 = torch.aten.unsqueeze %4199, %int0_5105 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_5106 = torch.constant.int 0 %int1_5107 = torch.constant.int 1 %4203 = torch.aten.select.int %4162, %int0_5106, %int1_5107 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_5108 = torch.constant.int 0 %int0_5109 = torch.constant.int 0 %4204 = torch.aten.select.int %4203, %int0_5108, %int0_5109 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %4205 = torch.prim.ListConstruct %4198, %4200, %4201, %4202 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_5110 = torch.constant.bool false %4206 = torch.aten.index_put %4193, %4205, %4204, %false_5110 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_5111 = torch.constant.int 2662400 %4207 = torch.prim.ListConstruct %731, %int2662400_5111 : (!torch.int, !torch.int) -> !torch.list %4208 = torch.aten.view %4206, %4207 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_5112 = torch.constant.int -1 %int26_5113 = torch.constant.int 26 %int2_5114 = torch.constant.int 2 %int16_5115 = torch.constant.int 16 %int32_5116 = torch.constant.int 32 %int100_5117 = torch.constant.int 100 %4209 = torch.prim.ListConstruct %int-1_5112, %int26_5113, %int2_5114, %int16_5115, %int32_5116, %int100_5117 : (!torch.int, !torch.int, !torch.int, 
!torch.int, !torch.int, !torch.int) -> !torch.list %4210 = torch.aten.view %4208, %4209 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_5118 = torch.constant.none %4211 = torch.aten.clone %452, %none_5118 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_5119 = torch.constant.none %4212 = torch.aten.clone %453, %none_5119 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_5120 = torch.constant.int 0 %4213 = torch.aten.unsqueeze %4199, %int0_5120 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_5121 = torch.constant.int 0 %int1_5122 = torch.constant.int 1 %4214 = torch.aten.select.int %4148, %int0_5121, %int1_5122 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_5123 = torch.constant.int 0 %int0_5124 = torch.constant.int 0 %4215 = torch.aten.select.int %4214, %int0_5123, %int0_5124 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %4216 = torch.prim.ListConstruct %4198, %4211, %4212, %4213 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_5125 = torch.constant.bool false %4217 = torch.aten.index_put %4210, %4216, %4215, %false_5125 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_5126 = torch.constant.int 2662400 %4218 = torch.prim.ListConstruct %731, %int2662400_5126 : (!torch.int, !torch.int) -> !torch.list %4219 = torch.aten.view %4217, %4218 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_5127 = torch.constant.int -1 %int26_5128 = torch.constant.int 26 %int2_5129 = torch.constant.int 2 %int16_5130 = torch.constant.int 16 %int32_5131 = torch.constant.int 32 %int100_5132 = torch.constant.int 100 %4220 = torch.prim.ListConstruct 
%int-1_5127, %int26_5128, %int2_5129, %int16_5130, %int32_5131, %int100_5132 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4221 = torch.aten.view %4219, %4220 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_5133 = torch.constant.int 0 %int2_5134 = torch.constant.int 2 %4222 = torch.aten.select.int %4163, %int0_5133, %int2_5134 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_5135 = torch.constant.int 0 %int2_5136 = torch.constant.int 2 %4223 = torch.aten.select.int %arg3, %int0_5135, %int2_5136 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_5137 = torch.constant.int 0 %int0_5138 = torch.constant.int 0 %int9223372036854775807_5139 = torch.constant.int 9223372036854775807 %int1_5140 = torch.constant.int 1 %4224 = torch.aten.slice.Tensor %4223, %int0_5137, %int0_5138, %int9223372036854775807_5139, %int1_5140 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_5141 = torch.constant.int 16 %4225 = torch.aten.floor_divide.Scalar %4222, %int16_5141 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_5142 = torch.constant.int 0 %4226 = torch.aten.index_select %4224, %int0_5142, %4225 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_5143 = torch.constant.int 16 %4227 = torch.aten.remainder.Scalar %4222, %int16_5143 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_5144 = torch.constant.none %4228 = torch.aten.clone %454, %none_5144 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_5145 = torch.constant.none %4229 = torch.aten.clone %455, %none_5145 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_5146 = torch.constant.int 0 %4230 = torch.aten.unsqueeze %4227, %int0_5146 : !torch.vtensor<[],si64>, !torch.int -> 
!torch.vtensor<[1],si64> %int0_5147 = torch.constant.int 0 %int2_5148 = torch.constant.int 2 %4231 = torch.aten.select.int %4162, %int0_5147, %int2_5148 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_5149 = torch.constant.int 0 %int0_5150 = torch.constant.int 0 %4232 = torch.aten.select.int %4231, %int0_5149, %int0_5150 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %4233 = torch.prim.ListConstruct %4226, %4228, %4229, %4230 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_5151 = torch.constant.bool false %4234 = torch.aten.index_put %4221, %4233, %4232, %false_5151 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_5152 = torch.constant.int 2662400 %4235 = torch.prim.ListConstruct %731, %int2662400_5152 : (!torch.int, !torch.int) -> !torch.list %4236 = torch.aten.view %4234, %4235 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_5153 = torch.constant.int -1 %int26_5154 = torch.constant.int 26 %int2_5155 = torch.constant.int 2 %int16_5156 = torch.constant.int 16 %int32_5157 = torch.constant.int 32 %int100_5158 = torch.constant.int 100 %4237 = torch.prim.ListConstruct %int-1_5153, %int26_5154, %int2_5155, %int16_5156, %int32_5157, %int100_5158 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4238 = torch.aten.view %4236, %4237 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_5159 = torch.constant.none %4239 = torch.aten.clone %456, %none_5159 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_5160 = torch.constant.none %4240 = torch.aten.clone %457, %none_5160 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_5161 = 
torch.constant.int 0 %4241 = torch.aten.unsqueeze %4227, %int0_5161 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_5162 = torch.constant.int 0 %int2_5163 = torch.constant.int 2 %4242 = torch.aten.select.int %4148, %int0_5162, %int2_5163 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_5164 = torch.constant.int 0 %int0_5165 = torch.constant.int 0 %4243 = torch.aten.select.int %4242, %int0_5164, %int0_5165 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %4244 = torch.prim.ListConstruct %4226, %4239, %4240, %4241 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_5166 = torch.constant.bool false %4245 = torch.aten.index_put %4238, %4244, %4243, %false_5166 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_5167 = torch.constant.int 2662400 %4246 = torch.prim.ListConstruct %731, %int2662400_5167 : (!torch.int, !torch.int) -> !torch.list %4247 = torch.aten.view %4245, %4246 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_5168 = torch.constant.int -1 %int26_5169 = torch.constant.int 26 %int2_5170 = torch.constant.int 2 %int16_5171 = torch.constant.int 16 %int32_5172 = torch.constant.int 32 %int100_5173 = torch.constant.int 100 %4248 = torch.prim.ListConstruct %int-1_5168, %int26_5169, %int2_5170, %int16_5171, %int32_5172, %int100_5173 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4249 = torch.aten.view %4247, %4248 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_5174 = torch.constant.int 0 %int3_5175 = torch.constant.int 3 %4250 = torch.aten.select.int %4163, %int0_5174, %int3_5175 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> 
!torch.vtensor<[],si64> %int0_5176 = torch.constant.int 0 %int3_5177 = torch.constant.int 3 %4251 = torch.aten.select.int %arg3, %int0_5176, %int3_5177 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_5178 = torch.constant.int 0 %int0_5179 = torch.constant.int 0 %int9223372036854775807_5180 = torch.constant.int 9223372036854775807 %int1_5181 = torch.constant.int 1 %4252 = torch.aten.slice.Tensor %4251, %int0_5178, %int0_5179, %int9223372036854775807_5180, %int1_5181 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_5182 = torch.constant.int 16 %4253 = torch.aten.floor_divide.Scalar %4250, %int16_5182 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_5183 = torch.constant.int 0 %4254 = torch.aten.index_select %4252, %int0_5183, %4253 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_5184 = torch.constant.int 16 %4255 = torch.aten.remainder.Scalar %4250, %int16_5184 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_5185 = torch.constant.none %4256 = torch.aten.clone %458, %none_5185 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_5186 = torch.constant.none %4257 = torch.aten.clone %459, %none_5186 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_5187 = torch.constant.int 0 %4258 = torch.aten.unsqueeze %4255, %int0_5187 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_5188 = torch.constant.int 0 %int3_5189 = torch.constant.int 3 %4259 = torch.aten.select.int %4162, %int0_5188, %int3_5189 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_5190 = torch.constant.int 0 %int0_5191 = torch.constant.int 0 %4260 = torch.aten.select.int %4259, %int0_5190, %int0_5191 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %4261 = 
torch.prim.ListConstruct %4254, %4256, %4257, %4258 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_5192 = torch.constant.bool false %4262 = torch.aten.index_put %4249, %4261, %4260, %false_5192 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_5193 = torch.constant.int 2662400 %4263 = torch.prim.ListConstruct %731, %int2662400_5193 : (!torch.int, !torch.int) -> !torch.list %4264 = torch.aten.view %4262, %4263 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_5194 = torch.constant.int -1 %int26_5195 = torch.constant.int 26 %int2_5196 = torch.constant.int 2 %int16_5197 = torch.constant.int 16 %int32_5198 = torch.constant.int 32 %int100_5199 = torch.constant.int 100 %4265 = torch.prim.ListConstruct %int-1_5194, %int26_5195, %int2_5196, %int16_5197, %int32_5198, %int100_5199 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4266 = torch.aten.view %4264, %4265 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_5200 = torch.constant.none %4267 = torch.aten.clone %460, %none_5200 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_5201 = torch.constant.none %4268 = torch.aten.clone %461, %none_5201 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_5202 = torch.constant.int 0 %4269 = torch.aten.unsqueeze %4255, %int0_5202 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_5203 = torch.constant.int 0 %int3_5204 = torch.constant.int 3 %4270 = torch.aten.select.int %4148, %int0_5203, %int3_5204 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_5205 = torch.constant.int 0 %int0_5206 = torch.constant.int 0 %4271 = torch.aten.select.int %4270, %int0_5205, 
%int0_5206 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %4272 = torch.prim.ListConstruct %4254, %4267, %4268, %4269 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_5207 = torch.constant.bool false %4273 = torch.aten.index_put %4266, %4272, %4271, %false_5207 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_5208 = torch.constant.int 2662400 %4274 = torch.prim.ListConstruct %731, %int2662400_5208 : (!torch.int, !torch.int) -> !torch.list %4275 = torch.aten.view %4273, %4274 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int52_5209 = torch.constant.int 52 %4276 = torch.aten.mul.Scalar %arg3, %int52_5209 : !torch.vtensor<[4,?],si64>, !torch.int -> !torch.vtensor<[4,?],si64> %int26_5210 = torch.constant.int 26 %int1_5211 = torch.constant.int 1 %4277 = torch.aten.add.Scalar %4276, %int26_5210, %int1_5211 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_5212 = torch.constant.int 4 %4278 = torch.aten.mul.int %int4_5212, %655 : !torch.int, !torch.int -> !torch.int %4279 = torch.prim.ListConstruct %4278 : (!torch.int) -> !torch.list %4280 = torch.aten.view %4277, %4279 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int-1_5213 = torch.constant.int -1 %int26_5214 = torch.constant.int 26 %int2_5215 = torch.constant.int 2 %int16_5216 = torch.constant.int 16 %int32_5217 = torch.constant.int 32 %int100_5218 = torch.constant.int 100 %4281 = torch.prim.ListConstruct %int-1_5213, %int26_5214, %int2_5215, %int16_5216, %int32_5217, %int100_5218 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4282 = torch.aten.view %4275, %4281 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> 
%int26_5219 = torch.constant.int 26 %4283 = torch.aten.mul.int %731, %int26_5219 : !torch.int, !torch.int -> !torch.int %int2_5220 = torch.constant.int 2 %4284 = torch.aten.mul.int %4283, %int2_5220 : !torch.int, !torch.int -> !torch.int %int16_5221 = torch.constant.int 16 %int32_5222 = torch.constant.int 32 %int100_5223 = torch.constant.int 100 %4285 = torch.prim.ListConstruct %4284, %int16_5221, %int32_5222, %int100_5223 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4286 = torch.aten.view %4282, %4285 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,16,32,100],f32> %int0_5224 = torch.constant.int 0 %4287 = torch.aten.index_select %4286, %int0_5224, %4280 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_5225 = torch.constant.int 4 %int16_5226 = torch.constant.int 16 %int32_5227 = torch.constant.int 32 %int100_5228 = torch.constant.int 100 %4288 = torch.prim.ListConstruct %int4_5225, %655, %int16_5226, %int32_5227, %int100_5228 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4289 = torch.aten.view %4287, %4288 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_5229 = torch.constant.int 1 %4290 = torch.aten.size.int %4289, %int1_5229 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_5230 = torch.constant.int 16 %4291 = torch.aten.mul.int %4290, %int16_5230 : !torch.int, !torch.int -> !torch.int %int4_5231 = torch.constant.int 4 %int32_5232 = torch.constant.int 32 %int100_5233 = torch.constant.int 100 %4292 = torch.prim.ListConstruct %int4_5231, %4291, %int32_5232, %int100_5233 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4293 = torch.aten.view %4289, %4292 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_5234 = torch.constant.int 0 %int0_5235 = torch.constant.int 0 %int9223372036854775807_5236 = 
torch.constant.int 9223372036854775807 %int1_5237 = torch.constant.int 1 %4294 = torch.aten.slice.Tensor %4035, %int0_5234, %int0_5235, %int9223372036854775807_5236, %int1_5237 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int16_5238 = torch.constant.int 16 %4295 = torch.aten.mul.int %655, %int16_5238 : !torch.int, !torch.int -> !torch.int %int1_5239 = torch.constant.int 1 %int0_5240 = torch.constant.int 0 %int1_5241 = torch.constant.int 1 %4296 = torch.aten.slice.Tensor %4294, %int1_5239, %int0_5240, %4295, %int1_5241 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_5242 = torch.constant.bool false %4297 = torch.aten.copy %4296, %4293, %false_5242 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_5243 = torch.constant.int 0 %int0_5244 = torch.constant.int 0 %int9223372036854775807_5245 = torch.constant.int 9223372036854775807 %int1_5246 = torch.constant.int 1 %4298 = torch.aten.slice.Tensor %4035, %int0_5243, %int0_5244, %int9223372036854775807_5245, %int1_5246 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_5247 = torch.constant.int 1 %int0_5248 = torch.constant.int 0 %int1_5249 = torch.constant.int 1 %4299 = torch.aten.slice_scatter %4298, %4297, %int1_5247, %int0_5248, %4295, %int1_5249 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_5250 = torch.constant.int 0 %int0_5251 = torch.constant.int 0 %int9223372036854775807_5252 = torch.constant.int 9223372036854775807 %int1_5253 = torch.constant.int 1 %4300 = torch.aten.slice_scatter %4035, %4299, %int0_5250, %int0_5251, %int9223372036854775807_5252, %int1_5253 : 
!torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_5254 = torch.constant.int 1 %int1_5255 = torch.constant.int 1 %4301 = torch.aten.add.Scalar %4277, %int1_5254, %int1_5255 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_5256 = torch.constant.int 4 %4302 = torch.aten.mul.int %int4_5256, %655 : !torch.int, !torch.int -> !torch.int %4303 = torch.prim.ListConstruct %4302 : (!torch.int) -> !torch.list %4304 = torch.aten.view %4301, %4303 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int0_5257 = torch.constant.int 0 %4305 = torch.aten.index_select %4286, %int0_5257, %4304 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_5258 = torch.constant.int 4 %int16_5259 = torch.constant.int 16 %int32_5260 = torch.constant.int 32 %int100_5261 = torch.constant.int 100 %4306 = torch.prim.ListConstruct %int4_5258, %655, %int16_5259, %int32_5260, %int100_5261 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4307 = torch.aten.view %4305, %4306 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_5262 = torch.constant.int 1 %4308 = torch.aten.size.int %4307, %int1_5262 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_5263 = torch.constant.int 16 %4309 = torch.aten.mul.int %4308, %int16_5263 : !torch.int, !torch.int -> !torch.int %int4_5264 = torch.constant.int 4 %int32_5265 = torch.constant.int 32 %int100_5266 = torch.constant.int 100 %4310 = torch.prim.ListConstruct %int4_5264, %4309, %int32_5265, %int100_5266 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4311 = torch.aten.view %4307, %4310 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_5267 = torch.constant.int 0 %int0_5268 = 
torch.constant.int 0 %int9223372036854775807_5269 = torch.constant.int 9223372036854775807 %int1_5270 = torch.constant.int 1 %4312 = torch.aten.slice.Tensor %4052, %int0_5267, %int0_5268, %int9223372036854775807_5269, %int1_5270 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_5271 = torch.constant.int 1 %int0_5272 = torch.constant.int 0 %int1_5273 = torch.constant.int 1 %4313 = torch.aten.slice.Tensor %4312, %int1_5271, %int0_5272, %4295, %int1_5273 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_5274 = torch.constant.bool false %4314 = torch.aten.copy %4313, %4311, %false_5274 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_5275 = torch.constant.int 0 %int0_5276 = torch.constant.int 0 %int9223372036854775807_5277 = torch.constant.int 9223372036854775807 %int1_5278 = torch.constant.int 1 %4315 = torch.aten.slice.Tensor %4052, %int0_5275, %int0_5276, %int9223372036854775807_5277, %int1_5278 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_5279 = torch.constant.int 1 %int0_5280 = torch.constant.int 0 %int1_5281 = torch.constant.int 1 %4316 = torch.aten.slice_scatter %4315, %4314, %int1_5279, %int0_5280, %4295, %int1_5281 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_5282 = torch.constant.int 0 %int0_5283 = torch.constant.int 0 %int9223372036854775807_5284 = torch.constant.int 9223372036854775807 %int1_5285 = torch.constant.int 1 %4317 = torch.aten.slice_scatter %4052, %4316, %int0_5282, %int0_5283, %int9223372036854775807_5284, %int1_5285 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, 
!torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_5286 = torch.constant.int 0 %int0_5287 = torch.constant.int 0 %int9223372036854775807_5288 = torch.constant.int 9223372036854775807 %int1_5289 = torch.constant.int 1 %4318 = torch.aten.slice.Tensor %671, %int0_5286, %int0_5287, %int9223372036854775807_5288, %int1_5289 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_5290 = torch.constant.int 1 %int0_5291 = torch.constant.int 0 %int1_5292 = torch.constant.int 1 %4319 = torch.aten.slice.Tensor %4318, %int1_5290, %int0_5291, %4295, %int1_5292 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int0_5293 = torch.constant.int 0 %int0_5294 = torch.constant.int 0 %int9223372036854775807_5295 = torch.constant.int 9223372036854775807 %int1_5296 = torch.constant.int 1 %4320 = torch.aten.slice.Tensor %673, %int0_5293, %int0_5294, %int9223372036854775807_5295, %int1_5296 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_5297 = torch.constant.int 1 %int0_5298 = torch.constant.int 0 %int1_5299 = torch.constant.int 1 %4321 = torch.aten.slice.Tensor %4320, %int1_5297, %int0_5298, %4295, %int1_5299 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_5300 = torch.constant.int 1 %int2_5301 = torch.constant.int 2 %4322 = torch.aten.transpose.int %4158, %int1_5300, %int2_5301 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,1,100],f32> %int4_5302 = torch.constant.int 4 %int32_5303 = torch.constant.int 32 %int1_5304 = torch.constant.int 1 %int100_5305 = torch.constant.int 100 %4323 = torch.prim.ListConstruct %int4_5302, %int32_5303, %int1_5304, %int100_5305 : (!torch.int, !torch.int, !torch.int, !torch.int) -> 
!torch.list %false_5306 = torch.constant.bool false %4324 = torch.aten.expand %4322, %4323, %false_5306 : !torch.vtensor<[4,32,1,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,100],f32> %int128_5307 = torch.constant.int 128 %int1_5308 = torch.constant.int 1 %int100_5309 = torch.constant.int 100 %4325 = torch.prim.ListConstruct %int128_5307, %int1_5308, %int100_5309 : (!torch.int, !torch.int, !torch.int) -> !torch.list %4326 = torch.aten.view %4324, %4325 : !torch.vtensor<[4,32,1,100],f32>, !torch.list -> !torch.vtensor<[128,1,100],f32> %int0_5310 = torch.constant.int 0 %int0_5311 = torch.constant.int 0 %int9223372036854775807_5312 = torch.constant.int 9223372036854775807 %int1_5313 = torch.constant.int 1 %4327 = torch.aten.slice.Tensor %4300, %int0_5310, %int0_5311, %int9223372036854775807_5312, %int1_5313 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_5314 = torch.constant.int 1 %int0_5315 = torch.constant.int 0 %int1_5316 = torch.constant.int 1 %4328 = torch.aten.slice.Tensor %4327, %int1_5314, %int0_5315, %4295, %int1_5316 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_5317 = torch.constant.int 1 %int2_5318 = torch.constant.int 2 %4329 = torch.aten.transpose.int %4328, %int1_5317, %int2_5318 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int2_5319 = torch.constant.int 2 %int3_5320 = torch.constant.int 3 %4330 = torch.aten.transpose.int %4329, %int2_5319, %int3_5320 : !torch.vtensor<[4,32,?,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int1_5321 = torch.constant.int 1 %4331 = torch.aten.size.int %4319, %int1_5321 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_5322 = torch.constant.int 4 %int32_5323 = torch.constant.int 32 %int100_5324 = torch.constant.int 100 %4332 = torch.prim.ListConstruct 
%int4_5322, %int32_5323, %int100_5324, %4331 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_5325 = torch.constant.bool false %4333 = torch.aten.expand %4330, %4332, %false_5325 : !torch.vtensor<[4,32,100,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,100,?],f32> %int0_5326 = torch.constant.int 0 %4334 = torch.aten.clone %4333, %int0_5326 : !torch.vtensor<[4,32,100,?],f32>, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int128_5327 = torch.constant.int 128 %int100_5328 = torch.constant.int 100 %4335 = torch.prim.ListConstruct %int128_5327, %int100_5328, %4331 : (!torch.int, !torch.int, !torch.int) -> !torch.list %4336 = torch.aten._unsafe_view %4334, %4335 : !torch.vtensor<[4,32,100,?],f32>, !torch.list -> !torch.vtensor<[128,100,?],f32> %4337 = torch.aten.bmm %4326, %4336 : !torch.vtensor<[128,1,100],f32>, !torch.vtensor<[128,100,?],f32> -> !torch.vtensor<[128,1,?],f32> %int4_5329 = torch.constant.int 4 %int32_5330 = torch.constant.int 32 %int1_5331 = torch.constant.int 1 %4338 = torch.prim.ListConstruct %int4_5329, %int32_5330, %int1_5331, %4331 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4339 = torch.aten.view %4337, %4338 : !torch.vtensor<[128,1,?],f32>, !torch.list -> !torch.vtensor<[4,32,1,?],f32> %float1.000000e01_5332 = torch.constant.float 1.000000e+01 %4340 = torch.aten.div.Scalar %4339, %float1.000000e01_5332 : !torch.vtensor<[4,32,1,?],f32>, !torch.float -> !torch.vtensor<[4,32,1,?],f32> %int1_5333 = torch.constant.int 1 %4341 = torch.aten.add.Tensor %4340, %895, %int1_5333 : !torch.vtensor<[4,32,1,?],f32>, !torch.vtensor<[4,1,1,?],f32>, !torch.int -> !torch.vtensor<[4,32,1,?],f32> %int-1_5334 = torch.constant.int -1 %false_5335 = torch.constant.bool false %4342 = torch.aten._softmax %4341, %int-1_5334, %false_5335 : !torch.vtensor<[4,32,1,?],f32>, !torch.int, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int4_5336 = torch.constant.int 4 %int32_5337 = torch.constant.int 32 %int1_5338 = 
torch.constant.int 1 %4343 = torch.prim.ListConstruct %int4_5336, %int32_5337, %int1_5338, %4331 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_5339 = torch.constant.bool false %4344 = torch.aten.expand %4342, %4343, %false_5339 : !torch.vtensor<[4,32,1,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int128_5340 = torch.constant.int 128 %int1_5341 = torch.constant.int 1 %4345 = torch.prim.ListConstruct %int128_5340, %int1_5341, %4331 : (!torch.int, !torch.int, !torch.int) -> !torch.list %4346 = torch.aten.view %4344, %4345 : !torch.vtensor<[4,32,1,?],f32>, !torch.list -> !torch.vtensor<[128,1,?],f32> %int0_5342 = torch.constant.int 0 %int0_5343 = torch.constant.int 0 %int9223372036854775807_5344 = torch.constant.int 9223372036854775807 %int1_5345 = torch.constant.int 1 %4347 = torch.aten.slice.Tensor %4317, %int0_5342, %int0_5343, %int9223372036854775807_5344, %int1_5345 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_5346 = torch.constant.int 1 %int0_5347 = torch.constant.int 0 %int1_5348 = torch.constant.int 1 %4348 = torch.aten.slice.Tensor %4347, %int1_5346, %int0_5347, %4295, %int1_5348 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_5349 = torch.constant.int 1 %int2_5350 = torch.constant.int 2 %4349 = torch.aten.transpose.int %4348, %int1_5349, %int2_5350 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int1_5351 = torch.constant.int 1 %4350 = torch.aten.size.int %4321, %int1_5351 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_5352 = torch.constant.int 4 %int32_5353 = torch.constant.int 32 %int100_5354 = torch.constant.int 100 %4351 = torch.prim.ListConstruct %int4_5352, %int32_5353, %4350, %int100_5354 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_5355 = 
torch.constant.bool false %4352 = torch.aten.expand %4349, %4351, %false_5355 : !torch.vtensor<[4,32,?,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,?,100],f32> %int0_5356 = torch.constant.int 0 %4353 = torch.aten.clone %4352, %int0_5356 : !torch.vtensor<[4,32,?,100],f32>, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int128_5357 = torch.constant.int 128 %int100_5358 = torch.constant.int 100 %4354 = torch.prim.ListConstruct %int128_5357, %4350, %int100_5358 : (!torch.int, !torch.int, !torch.int) -> !torch.list %4355 = torch.aten._unsafe_view %4353, %4354 : !torch.vtensor<[4,32,?,100],f32>, !torch.list -> !torch.vtensor<[128,?,100],f32> %4356 = torch.aten.bmm %4346, %4355 : !torch.vtensor<[128,1,?],f32>, !torch.vtensor<[128,?,100],f32> -> !torch.vtensor<[128,1,100],f32> %int4_5359 = torch.constant.int 4 %int32_5360 = torch.constant.int 32 %int1_5361 = torch.constant.int 1 %int100_5362 = torch.constant.int 100 %4357 = torch.prim.ListConstruct %int4_5359, %int32_5360, %int1_5361, %int100_5362 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4358 = torch.aten.view %4356, %4357 : !torch.vtensor<[128,1,100],f32>, !torch.list -> !torch.vtensor<[4,32,1,100],f32> %int1_5363 = torch.constant.int 1 %int2_5364 = torch.constant.int 2 %4359 = torch.aten.transpose.int %4358, %int1_5363, %int2_5364 : !torch.vtensor<[4,32,1,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,1,32,100],f32> %int4_5365 = torch.constant.int 4 %int1_5366 = torch.constant.int 1 %int-1_5367 = torch.constant.int -1 %4360 = torch.prim.ListConstruct %int4_5365, %int1_5366, %int-1_5367 : (!torch.int, !torch.int, !torch.int) -> !torch.list %4361 = torch.aten.view %4359, %4360 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,3200],f32> %4362 = torch_c.to_builtin_tensor %4361 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_5368 = tensor.cast %4362 : tensor<4x1x3200xf32> to tensor %4363 = torch_c.to_builtin_tensor %123 : 
!torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %4364 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_5368, %4363) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_5369 = tensor.cast %4364 : tensor to tensor<4x1x3200xf32> %4365 = torch_c.from_builtin_tensor %cast_5369 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int1_5370 = torch.constant.int 1 %4366 = torch.aten.add.Tensor %4123, %4365, %int1_5370 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_5371 = torch.constant.int 2 %4367 = torch.aten.pow.Tensor_Scalar %4366, %int2_5371 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_5372 = torch.constant.int -1 %4368 = torch.prim.ListConstruct %int-1_5372 : (!torch.int) -> !torch.list %true_5373 = torch.constant.bool true %none_5374 = torch.constant.none %4369 = torch.aten.mean.dim %4367, %4368, %true_5373, %none_5374 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_5375 = torch.constant.float 9.9999999747524271E-7 %int1_5376 = torch.constant.int 1 %4370 = torch.aten.add.Scalar %4369, %float9.999990e-07_5375, %int1_5376 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %4371 = torch.aten.rsqrt %4370 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %4372 = torch.aten.mul.Tensor %4366, %4371 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %4373 = torch.aten.mul.Tensor %4372, %124 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %4374 = torch_c.to_builtin_tensor %4373 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_5377 = tensor.cast %4374 : tensor<4x1x3200xf32> to tensor %4375 = torch_c.to_builtin_tensor %125 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %4376 = util.call 
@sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_5377, %4375) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_5378 = tensor.cast %4376 : tensor to tensor<4x1x8640xf32> %4377 = torch_c.from_builtin_tensor %cast_5378 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %4378 = torch.aten.silu %4377 : !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32> %4379 = torch_c.to_builtin_tensor %4373 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_5379 = tensor.cast %4379 : tensor<4x1x3200xf32> to tensor %4380 = torch_c.to_builtin_tensor %126 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %4381 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_5379, %4380) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_5380 = tensor.cast %4381 : tensor to tensor<4x1x8640xf32> %4382 = torch_c.from_builtin_tensor %cast_5380 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %4383 = torch.aten.mul.Tensor %4378, %4382 : !torch.vtensor<[4,1,8640],f32>, !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32> %4384 = torch_c.to_builtin_tensor %4383 : !torch.vtensor<[4,1,8640],f32> -> tensor<4x1x8640xf32> %cast_5381 = tensor.cast %4384 : tensor<4x1x8640xf32> to tensor %4385 = torch_c.to_builtin_tensor %127 : !torch.vtensor<[3200,8640],f16> -> tensor<3200x8640xf16> %4386 = util.call @sharktank_mmtfp_3d_3200_8640_f32f16f32(%cast_5381, %4385) : (tensor, tensor<3200x8640xf16>) -> tensor %cast_5382 = tensor.cast %4386 : tensor to tensor<4x1x3200xf32> %4387 = torch_c.from_builtin_tensor %cast_5382 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int1_5383 = torch.constant.int 1 %4388 = torch.aten.add.Tensor %4366, %4387, %int1_5383 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_5384 = torch.constant.int 2 %4389 = torch.aten.pow.Tensor_Scalar %4388, %int2_5384 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_5385 = 
torch.constant.int -1 %4390 = torch.prim.ListConstruct %int-1_5385 : (!torch.int) -> !torch.list %true_5386 = torch.constant.bool true %none_5387 = torch.constant.none %4391 = torch.aten.mean.dim %4389, %4390, %true_5386, %none_5387 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_5388 = torch.constant.float 9.9999999747524271E-7 %int1_5389 = torch.constant.int 1 %4392 = torch.aten.add.Scalar %4391, %float9.999990e-07_5388, %int1_5389 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %4393 = torch.aten.rsqrt %4392 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %4394 = torch.aten.mul.Tensor %4388, %4393 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %4395 = torch.aten.mul.Tensor %4394, %128 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %4396 = torch_c.to_builtin_tensor %4395 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_5390 = tensor.cast %4396 : tensor<4x1x3200xf32> to tensor %4397 = torch_c.to_builtin_tensor %129 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %4398 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_5390, %4397) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_5391 = tensor.cast %4398 : tensor to tensor<4x1x3200xf32> %4399 = torch_c.from_builtin_tensor %cast_5391 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %4400 = torch_c.to_builtin_tensor %4395 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_5392 = tensor.cast %4400 : tensor<4x1x3200xf32> to tensor %4401 = torch_c.to_builtin_tensor %130 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %4402 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_5392, %4401) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_5393 = tensor.cast %4402 : tensor to tensor<4x1x3200xf32> %4403 = torch_c.from_builtin_tensor 
%cast_5393 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %4404 = torch_c.to_builtin_tensor %4395 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_5394 = tensor.cast %4404 : tensor<4x1x3200xf32> to tensor %4405 = torch_c.to_builtin_tensor %131 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %4406 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_5394, %4405) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_5395 = tensor.cast %4406 : tensor to tensor<4x1x3200xf32> %4407 = torch_c.from_builtin_tensor %cast_5395 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int4_5396 = torch.constant.int 4 %int1_5397 = torch.constant.int 1 %int32_5398 = torch.constant.int 32 %int100_5399 = torch.constant.int 100 %4408 = torch.prim.ListConstruct %int4_5396, %int1_5397, %int32_5398, %int100_5399 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4409 = torch.aten.view %4399, %4408 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_5400 = torch.constant.int 4 %int1_5401 = torch.constant.int 1 %int32_5402 = torch.constant.int 32 %int100_5403 = torch.constant.int 100 %4410 = torch.prim.ListConstruct %int4_5400, %int1_5401, %int32_5402, %int100_5403 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4411 = torch.aten.view %4403, %4410 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_5404 = torch.constant.int 4 %int1_5405 = torch.constant.int 1 %int32_5406 = torch.constant.int 32 %int100_5407 = torch.constant.int 100 %4412 = torch.prim.ListConstruct %int4_5404, %int1_5405, %int32_5406, %int100_5407 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4413 = torch.aten.view %4407, %4412 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_5408 = torch.constant.int 4 %int1_5409 = torch.constant.int 1 %int32_5410 = torch.constant.int 32 %int-1_5411 = torch.constant.int -1 %int2_5412 = 
torch.constant.int 2 %4414 = torch.prim.ListConstruct %int4_5408, %int1_5409, %int32_5410, %int-1_5411, %int2_5412 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4415 = torch.aten.view %4409, %4414 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %4416 = torch.aten.view_as_complex %4415 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %int4_5413 = torch.constant.int 4 %int1_5414 = torch.constant.int 1 %int32_5415 = torch.constant.int 32 %int-1_5416 = torch.constant.int -1 %int2_5417 = torch.constant.int 2 %4417 = torch.prim.ListConstruct %int4_5413, %int1_5414, %int32_5415, %int-1_5416, %int2_5417 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4418 = torch.aten.view %4411, %4417 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %4419 = torch.aten.view_as_complex %4418 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %4420 = torch.aten.mul.Tensor %4416, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %4421 = torch.aten.view_as_real %4420 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_5418 = torch.constant.int 4 %int1_5419 = torch.constant.int 1 %int32_5420 = torch.constant.int 32 %int100_5421 = torch.constant.int 100 %4422 = torch.prim.ListConstruct %int4_5418, %int1_5419, %int32_5420, %int100_5421 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4423 = torch.aten.view %4421, %4422 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %4424 = torch.aten.mul.Tensor %4419, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %4425 = torch.aten.view_as_real %4424 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_5422 = torch.constant.int 4 
%int1_5423 = torch.constant.int 1 %int32_5424 = torch.constant.int 32 %int100_5425 = torch.constant.int 100 %4426 = torch.prim.ListConstruct %int4_5422, %int1_5423, %int32_5424, %int100_5425 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4427 = torch.aten.view %4425, %4426 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int1_5426 = torch.constant.int 1 %int1_5427 = torch.constant.int 1 %4428 = torch.aten.add.Scalar %arg2, %int1_5426, %int1_5427 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[4],si64> %int0_5428 = torch.constant.int 0 %int0_5429 = torch.constant.int 0 %4429 = torch.aten.select.int %4428, %int0_5428, %int0_5429 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_5430 = torch.constant.int 0 %int0_5431 = torch.constant.int 0 %4430 = torch.aten.select.int %arg3, %int0_5430, %int0_5431 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_5432 = torch.constant.int 0 %int0_5433 = torch.constant.int 0 %int9223372036854775807_5434 = torch.constant.int 9223372036854775807 %int1_5435 = torch.constant.int 1 %4431 = torch.aten.slice.Tensor %4430, %int0_5432, %int0_5433, %int9223372036854775807_5434, %int1_5435 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_5436 = torch.constant.int 16 %4432 = torch.aten.floor_divide.Scalar %4429, %int16_5436 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_5437 = torch.constant.int 0 %4433 = torch.aten.index_select %4431, %int0_5437, %4432 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_5438 = torch.constant.int 16 %4434 = torch.aten.remainder.Scalar %4429, %int16_5438 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_5439 = torch.constant.none %4435 = torch.aten.clone %462, %none_5439 : !torch.vtensor<[1],si64>, !torch.none -> 
!torch.vtensor<[1],si64> %none_5440 = torch.constant.none %4436 = torch.aten.clone %463, %none_5440 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_5441 = torch.constant.int 0 %4437 = torch.aten.unsqueeze %4434, %int0_5441 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_5442 = torch.constant.int 0 %int0_5443 = torch.constant.int 0 %4438 = torch.aten.select.int %4427, %int0_5442, %int0_5443 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_5444 = torch.constant.int 0 %int0_5445 = torch.constant.int 0 %4439 = torch.aten.select.int %4438, %int0_5444, %int0_5445 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %int-1_5446 = torch.constant.int -1 %int26_5447 = torch.constant.int 26 %int2_5448 = torch.constant.int 2 %int16_5449 = torch.constant.int 16 %int32_5450 = torch.constant.int 32 %int100_5451 = torch.constant.int 100 %4440 = torch.prim.ListConstruct %int-1_5446, %int26_5447, %int2_5448, %int16_5449, %int32_5450, %int100_5451 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4441 = torch.aten.view %4275, %4440 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %4442 = torch.prim.ListConstruct %4433, %4435, %4436, %4437 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_5452 = torch.constant.bool false %4443 = torch.aten.index_put %4441, %4442, %4439, %false_5452 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_5453 = torch.constant.int 2662400 %4444 = torch.prim.ListConstruct %731, %int2662400_5453 : (!torch.int, !torch.int) -> !torch.list %4445 = torch.aten.view %4443, %4444 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> 
%int-1_5454 = torch.constant.int -1 %int26_5455 = torch.constant.int 26 %int2_5456 = torch.constant.int 2 %int16_5457 = torch.constant.int 16 %int32_5458 = torch.constant.int 32 %int100_5459 = torch.constant.int 100 %4446 = torch.prim.ListConstruct %int-1_5454, %int26_5455, %int2_5456, %int16_5457, %int32_5458, %int100_5459 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4447 = torch.aten.view %4445, %4446 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_5460 = torch.constant.none %4448 = torch.aten.clone %464, %none_5460 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_5461 = torch.constant.none %4449 = torch.aten.clone %465, %none_5461 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_5462 = torch.constant.int 0 %4450 = torch.aten.unsqueeze %4434, %int0_5462 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_5463 = torch.constant.int 0 %int0_5464 = torch.constant.int 0 %4451 = torch.aten.select.int %4413, %int0_5463, %int0_5464 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_5465 = torch.constant.int 0 %int0_5466 = torch.constant.int 0 %4452 = torch.aten.select.int %4451, %int0_5465, %int0_5466 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %4453 = torch.prim.ListConstruct %4433, %4448, %4449, %4450 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_5467 = torch.constant.bool false %4454 = torch.aten.index_put %4447, %4453, %4452, %false_5467 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_5468 = torch.constant.int 2662400 %4455 = torch.prim.ListConstruct %731, %int2662400_5468 : (!torch.int, !torch.int) -> !torch.list %4456 = 
torch.aten.view %4454, %4455 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_5469 = torch.constant.int -1 %int26_5470 = torch.constant.int 26 %int2_5471 = torch.constant.int 2 %int16_5472 = torch.constant.int 16 %int32_5473 = torch.constant.int 32 %int100_5474 = torch.constant.int 100 %4457 = torch.prim.ListConstruct %int-1_5469, %int26_5470, %int2_5471, %int16_5472, %int32_5473, %int100_5474 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4458 = torch.aten.view %4456, %4457 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_5475 = torch.constant.int 0 %int1_5476 = torch.constant.int 1 %4459 = torch.aten.select.int %4428, %int0_5475, %int1_5476 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_5477 = torch.constant.int 0 %int1_5478 = torch.constant.int 1 %4460 = torch.aten.select.int %arg3, %int0_5477, %int1_5478 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_5479 = torch.constant.int 0 %int0_5480 = torch.constant.int 0 %int9223372036854775807_5481 = torch.constant.int 9223372036854775807 %int1_5482 = torch.constant.int 1 %4461 = torch.aten.slice.Tensor %4460, %int0_5479, %int0_5480, %int9223372036854775807_5481, %int1_5482 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_5483 = torch.constant.int 16 %4462 = torch.aten.floor_divide.Scalar %4459, %int16_5483 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_5484 = torch.constant.int 0 %4463 = torch.aten.index_select %4461, %int0_5484, %4462 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_5485 = torch.constant.int 16 %4464 = torch.aten.remainder.Scalar %4459, %int16_5485 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_5486 = torch.constant.none %4465 = 
torch.aten.clone %466, %none_5486 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_5487 = torch.constant.none %4466 = torch.aten.clone %467, %none_5487 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_5488 = torch.constant.int 0 %4467 = torch.aten.unsqueeze %4464, %int0_5488 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_5489 = torch.constant.int 0 %int1_5490 = torch.constant.int 1 %4468 = torch.aten.select.int %4427, %int0_5489, %int1_5490 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_5491 = torch.constant.int 0 %int0_5492 = torch.constant.int 0 %4469 = torch.aten.select.int %4468, %int0_5491, %int0_5492 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %4470 = torch.prim.ListConstruct %4463, %4465, %4466, %4467 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_5493 = torch.constant.bool false %4471 = torch.aten.index_put %4458, %4470, %4469, %false_5493 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_5494 = torch.constant.int 2662400 %4472 = torch.prim.ListConstruct %731, %int2662400_5494 : (!torch.int, !torch.int) -> !torch.list %4473 = torch.aten.view %4471, %4472 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_5495 = torch.constant.int -1 %int26_5496 = torch.constant.int 26 %int2_5497 = torch.constant.int 2 %int16_5498 = torch.constant.int 16 %int32_5499 = torch.constant.int 32 %int100_5500 = torch.constant.int 100 %4474 = torch.prim.ListConstruct %int-1_5495, %int26_5496, %int2_5497, %int16_5498, %int32_5499, %int100_5500 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4475 = torch.aten.view %4473, %4474 : 
!torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_5501 = torch.constant.none %4476 = torch.aten.clone %468, %none_5501 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_5502 = torch.constant.none %4477 = torch.aten.clone %469, %none_5502 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_5503 = torch.constant.int 0 %4478 = torch.aten.unsqueeze %4464, %int0_5503 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_5504 = torch.constant.int 0 %int1_5505 = torch.constant.int 1 %4479 = torch.aten.select.int %4413, %int0_5504, %int1_5505 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_5506 = torch.constant.int 0 %int0_5507 = torch.constant.int 0 %4480 = torch.aten.select.int %4479, %int0_5506, %int0_5507 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %4481 = torch.prim.ListConstruct %4463, %4476, %4477, %4478 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_5508 = torch.constant.bool false %4482 = torch.aten.index_put %4475, %4481, %4480, %false_5508 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_5509 = torch.constant.int 2662400 %4483 = torch.prim.ListConstruct %731, %int2662400_5509 : (!torch.int, !torch.int) -> !torch.list %4484 = torch.aten.view %4482, %4483 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_5510 = torch.constant.int -1 %int26_5511 = torch.constant.int 26 %int2_5512 = torch.constant.int 2 %int16_5513 = torch.constant.int 16 %int32_5514 = torch.constant.int 32 %int100_5515 = torch.constant.int 100 %4485 = torch.prim.ListConstruct %int-1_5510, %int26_5511, %int2_5512, %int16_5513, %int32_5514, %int100_5515 : (!torch.int, 
!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4486 = torch.aten.view %4484, %4485 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_5516 = torch.constant.int 0 %int2_5517 = torch.constant.int 2 %4487 = torch.aten.select.int %4428, %int0_5516, %int2_5517 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_5518 = torch.constant.int 0 %int2_5519 = torch.constant.int 2 %4488 = torch.aten.select.int %arg3, %int0_5518, %int2_5519 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_5520 = torch.constant.int 0 %int0_5521 = torch.constant.int 0 %int9223372036854775807_5522 = torch.constant.int 9223372036854775807 %int1_5523 = torch.constant.int 1 %4489 = torch.aten.slice.Tensor %4488, %int0_5520, %int0_5521, %int9223372036854775807_5522, %int1_5523 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_5524 = torch.constant.int 16 %4490 = torch.aten.floor_divide.Scalar %4487, %int16_5524 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_5525 = torch.constant.int 0 %4491 = torch.aten.index_select %4489, %int0_5525, %4490 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_5526 = torch.constant.int 16 %4492 = torch.aten.remainder.Scalar %4487, %int16_5526 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_5527 = torch.constant.none %4493 = torch.aten.clone %470, %none_5527 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_5528 = torch.constant.none %4494 = torch.aten.clone %471, %none_5528 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_5529 = torch.constant.int 0 %4495 = torch.aten.unsqueeze %4492, %int0_5529 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_5530 = torch.constant.int 0 %int2_5531 = torch.constant.int 2 %4496 
= torch.aten.select.int %4427, %int0_5530, %int2_5531 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_5532 = torch.constant.int 0 %int0_5533 = torch.constant.int 0 %4497 = torch.aten.select.int %4496, %int0_5532, %int0_5533 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %4498 = torch.prim.ListConstruct %4491, %4493, %4494, %4495 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_5534 = torch.constant.bool false %4499 = torch.aten.index_put %4486, %4498, %4497, %false_5534 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_5535 = torch.constant.int 2662400 %4500 = torch.prim.ListConstruct %731, %int2662400_5535 : (!torch.int, !torch.int) -> !torch.list %4501 = torch.aten.view %4499, %4500 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_5536 = torch.constant.int -1 %int26_5537 = torch.constant.int 26 %int2_5538 = torch.constant.int 2 %int16_5539 = torch.constant.int 16 %int32_5540 = torch.constant.int 32 %int100_5541 = torch.constant.int 100 %4502 = torch.prim.ListConstruct %int-1_5536, %int26_5537, %int2_5538, %int16_5539, %int32_5540, %int100_5541 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4503 = torch.aten.view %4501, %4502 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_5542 = torch.constant.none %4504 = torch.aten.clone %472, %none_5542 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_5543 = torch.constant.none %4505 = torch.aten.clone %473, %none_5543 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_5544 = torch.constant.int 0 %4506 = torch.aten.unsqueeze %4492, %int0_5544 : !torch.vtensor<[],si64>, 
!torch.int -> !torch.vtensor<[1],si64> %int0_5545 = torch.constant.int 0 %int2_5546 = torch.constant.int 2 %4507 = torch.aten.select.int %4413, %int0_5545, %int2_5546 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_5547 = torch.constant.int 0 %int0_5548 = torch.constant.int 0 %4508 = torch.aten.select.int %4507, %int0_5547, %int0_5548 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %4509 = torch.prim.ListConstruct %4491, %4504, %4505, %4506 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_5549 = torch.constant.bool false %4510 = torch.aten.index_put %4503, %4509, %4508, %false_5549 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_5550 = torch.constant.int 2662400 %4511 = torch.prim.ListConstruct %731, %int2662400_5550 : (!torch.int, !torch.int) -> !torch.list %4512 = torch.aten.view %4510, %4511 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_5551 = torch.constant.int -1 %int26_5552 = torch.constant.int 26 %int2_5553 = torch.constant.int 2 %int16_5554 = torch.constant.int 16 %int32_5555 = torch.constant.int 32 %int100_5556 = torch.constant.int 100 %4513 = torch.prim.ListConstruct %int-1_5551, %int26_5552, %int2_5553, %int16_5554, %int32_5555, %int100_5556 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4514 = torch.aten.view %4512, %4513 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_5557 = torch.constant.int 0 %int3_5558 = torch.constant.int 3 %4515 = torch.aten.select.int %4428, %int0_5557, %int3_5558 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_5559 = torch.constant.int 0 %int3_5560 = torch.constant.int 3 %4516 = 
torch.aten.select.int %arg3, %int0_5559, %int3_5560 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_5561 = torch.constant.int 0 %int0_5562 = torch.constant.int 0 %int9223372036854775807_5563 = torch.constant.int 9223372036854775807 %int1_5564 = torch.constant.int 1 %4517 = torch.aten.slice.Tensor %4516, %int0_5561, %int0_5562, %int9223372036854775807_5563, %int1_5564 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_5565 = torch.constant.int 16 %4518 = torch.aten.floor_divide.Scalar %4515, %int16_5565 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_5566 = torch.constant.int 0 %4519 = torch.aten.index_select %4517, %int0_5566, %4518 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_5567 = torch.constant.int 16 %4520 = torch.aten.remainder.Scalar %4515, %int16_5567 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_5568 = torch.constant.none %4521 = torch.aten.clone %474, %none_5568 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_5569 = torch.constant.none %4522 = torch.aten.clone %475, %none_5569 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_5570 = torch.constant.int 0 %4523 = torch.aten.unsqueeze %4520, %int0_5570 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_5571 = torch.constant.int 0 %int3_5572 = torch.constant.int 3 %4524 = torch.aten.select.int %4427, %int0_5571, %int3_5572 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_5573 = torch.constant.int 0 %int0_5574 = torch.constant.int 0 %4525 = torch.aten.select.int %4524, %int0_5573, %int0_5574 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %4526 = torch.prim.ListConstruct %4519, %4521, %4522, %4523 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, 
!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_5575 = torch.constant.bool false %4527 = torch.aten.index_put %4514, %4526, %4525, %false_5575 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_5576 = torch.constant.int 2662400 %4528 = torch.prim.ListConstruct %731, %int2662400_5576 : (!torch.int, !torch.int) -> !torch.list %4529 = torch.aten.view %4527, %4528 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_5577 = torch.constant.int -1 %int26_5578 = torch.constant.int 26 %int2_5579 = torch.constant.int 2 %int16_5580 = torch.constant.int 16 %int32_5581 = torch.constant.int 32 %int100_5582 = torch.constant.int 100 %4530 = torch.prim.ListConstruct %int-1_5577, %int26_5578, %int2_5579, %int16_5580, %int32_5581, %int100_5582 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4531 = torch.aten.view %4529, %4530 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_5583 = torch.constant.none %4532 = torch.aten.clone %476, %none_5583 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_5584 = torch.constant.none %4533 = torch.aten.clone %477, %none_5584 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_5585 = torch.constant.int 0 %4534 = torch.aten.unsqueeze %4520, %int0_5585 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_5586 = torch.constant.int 0 %int3_5587 = torch.constant.int 3 %4535 = torch.aten.select.int %4413, %int0_5586, %int3_5587 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_5588 = torch.constant.int 0 %int0_5589 = torch.constant.int 0 %4536 = torch.aten.select.int %4535, %int0_5588, %int0_5589 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %4537 
= torch.prim.ListConstruct %4519, %4532, %4533, %4534 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_5590 = torch.constant.bool false %4538 = torch.aten.index_put %4531, %4537, %4536, %false_5590 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_5591 = torch.constant.int 2662400 %4539 = torch.prim.ListConstruct %731, %int2662400_5591 : (!torch.int, !torch.int) -> !torch.list %4540 = torch.aten.view %4538, %4539 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int52_5592 = torch.constant.int 52 %4541 = torch.aten.mul.Scalar %arg3, %int52_5592 : !torch.vtensor<[4,?],si64>, !torch.int -> !torch.vtensor<[4,?],si64> %int28 = torch.constant.int 28 %int1_5593 = torch.constant.int 1 %4542 = torch.aten.add.Scalar %4541, %int28, %int1_5593 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_5594 = torch.constant.int 4 %4543 = torch.aten.mul.int %int4_5594, %655 : !torch.int, !torch.int -> !torch.int %4544 = torch.prim.ListConstruct %4543 : (!torch.int) -> !torch.list %4545 = torch.aten.view %4542, %4544 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int-1_5595 = torch.constant.int -1 %int26_5596 = torch.constant.int 26 %int2_5597 = torch.constant.int 2 %int16_5598 = torch.constant.int 16 %int32_5599 = torch.constant.int 32 %int100_5600 = torch.constant.int 100 %4546 = torch.prim.ListConstruct %int-1_5595, %int26_5596, %int2_5597, %int16_5598, %int32_5599, %int100_5600 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4547 = torch.aten.view %4540, %4546 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int26_5601 = torch.constant.int 26 %4548 = torch.aten.mul.int %731, %int26_5601 : !torch.int, !torch.int -> 
!torch.int %int2_5602 = torch.constant.int 2 %4549 = torch.aten.mul.int %4548, %int2_5602 : !torch.int, !torch.int -> !torch.int %int16_5603 = torch.constant.int 16 %int32_5604 = torch.constant.int 32 %int100_5605 = torch.constant.int 100 %4550 = torch.prim.ListConstruct %4549, %int16_5603, %int32_5604, %int100_5605 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4551 = torch.aten.view %4547, %4550 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,16,32,100],f32> %int0_5606 = torch.constant.int 0 %4552 = torch.aten.index_select %4551, %int0_5606, %4545 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_5607 = torch.constant.int 4 %int16_5608 = torch.constant.int 16 %int32_5609 = torch.constant.int 32 %int100_5610 = torch.constant.int 100 %4553 = torch.prim.ListConstruct %int4_5607, %655, %int16_5608, %int32_5609, %int100_5610 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4554 = torch.aten.view %4552, %4553 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_5611 = torch.constant.int 1 %4555 = torch.aten.size.int %4554, %int1_5611 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_5612 = torch.constant.int 16 %4556 = torch.aten.mul.int %4555, %int16_5612 : !torch.int, !torch.int -> !torch.int %int4_5613 = torch.constant.int 4 %int32_5614 = torch.constant.int 32 %int100_5615 = torch.constant.int 100 %4557 = torch.prim.ListConstruct %int4_5613, %4556, %int32_5614, %int100_5615 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4558 = torch.aten.view %4554, %4557 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_5616 = torch.constant.int 0 %int0_5617 = torch.constant.int 0 %int9223372036854775807_5618 = torch.constant.int 9223372036854775807 %int1_5619 = torch.constant.int 1 %4559 = torch.aten.slice.Tensor 
%4300, %int0_5616, %int0_5617, %int9223372036854775807_5618, %int1_5619 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int16_5620 = torch.constant.int 16 %4560 = torch.aten.mul.int %655, %int16_5620 : !torch.int, !torch.int -> !torch.int %int1_5621 = torch.constant.int 1 %int0_5622 = torch.constant.int 0 %int1_5623 = torch.constant.int 1 %4561 = torch.aten.slice.Tensor %4559, %int1_5621, %int0_5622, %4560, %int1_5623 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_5624 = torch.constant.bool false %4562 = torch.aten.copy %4561, %4558, %false_5624 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_5625 = torch.constant.int 0 %int0_5626 = torch.constant.int 0 %int9223372036854775807_5627 = torch.constant.int 9223372036854775807 %int1_5628 = torch.constant.int 1 %4563 = torch.aten.slice.Tensor %4300, %int0_5625, %int0_5626, %int9223372036854775807_5627, %int1_5628 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_5629 = torch.constant.int 1 %int0_5630 = torch.constant.int 0 %int1_5631 = torch.constant.int 1 %4564 = torch.aten.slice_scatter %4563, %4562, %int1_5629, %int0_5630, %4560, %int1_5631 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_5632 = torch.constant.int 0 %int0_5633 = torch.constant.int 0 %int9223372036854775807_5634 = torch.constant.int 9223372036854775807 %int1_5635 = torch.constant.int 1 %4565 = torch.aten.slice_scatter %4300, %4564, %int0_5632, %int0_5633, %int9223372036854775807_5634, %int1_5635 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> 
!torch.vtensor<[4,2048,32,100],f32> %int1_5636 = torch.constant.int 1 %int1_5637 = torch.constant.int 1 %4566 = torch.aten.add.Scalar %4542, %int1_5636, %int1_5637 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_5638 = torch.constant.int 4 %4567 = torch.aten.mul.int %int4_5638, %655 : !torch.int, !torch.int -> !torch.int %4568 = torch.prim.ListConstruct %4567 : (!torch.int) -> !torch.list %4569 = torch.aten.view %4566, %4568 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int0_5639 = torch.constant.int 0 %4570 = torch.aten.index_select %4551, %int0_5639, %4569 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_5640 = torch.constant.int 4 %int16_5641 = torch.constant.int 16 %int32_5642 = torch.constant.int 32 %int100_5643 = torch.constant.int 100 %4571 = torch.prim.ListConstruct %int4_5640, %655, %int16_5641, %int32_5642, %int100_5643 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4572 = torch.aten.view %4570, %4571 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_5644 = torch.constant.int 1 %4573 = torch.aten.size.int %4572, %int1_5644 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_5645 = torch.constant.int 16 %4574 = torch.aten.mul.int %4573, %int16_5645 : !torch.int, !torch.int -> !torch.int %int4_5646 = torch.constant.int 4 %int32_5647 = torch.constant.int 32 %int100_5648 = torch.constant.int 100 %4575 = torch.prim.ListConstruct %int4_5646, %4574, %int32_5647, %int100_5648 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4576 = torch.aten.view %4572, %4575 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_5649 = torch.constant.int 0 %int0_5650 = torch.constant.int 0 %int9223372036854775807_5651 = torch.constant.int 9223372036854775807 %int1_5652 = torch.constant.int 1 %4577 = 
torch.aten.slice.Tensor %4317, %int0_5649, %int0_5650, %int9223372036854775807_5651, %int1_5652 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_5653 = torch.constant.int 1 %int0_5654 = torch.constant.int 0 %int1_5655 = torch.constant.int 1 %4578 = torch.aten.slice.Tensor %4577, %int1_5653, %int0_5654, %4560, %int1_5655 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_5656 = torch.constant.bool false %4579 = torch.aten.copy %4578, %4576, %false_5656 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_5657 = torch.constant.int 0 %int0_5658 = torch.constant.int 0 %int9223372036854775807_5659 = torch.constant.int 9223372036854775807 %int1_5660 = torch.constant.int 1 %4580 = torch.aten.slice.Tensor %4317, %int0_5657, %int0_5658, %int9223372036854775807_5659, %int1_5660 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_5661 = torch.constant.int 1 %int0_5662 = torch.constant.int 0 %int1_5663 = torch.constant.int 1 %4581 = torch.aten.slice_scatter %4580, %4579, %int1_5661, %int0_5662, %4560, %int1_5663 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_5664 = torch.constant.int 0 %int0_5665 = torch.constant.int 0 %int9223372036854775807_5666 = torch.constant.int 9223372036854775807 %int1_5667 = torch.constant.int 1 %4582 = torch.aten.slice_scatter %4317, %4581, %int0_5664, %int0_5665, %int9223372036854775807_5666, %int1_5667 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_5668 = torch.constant.int 0 %int0_5669 = torch.constant.int 0 
%int9223372036854775807_5670 = torch.constant.int 9223372036854775807 %int1_5671 = torch.constant.int 1 %4583 = torch.aten.slice.Tensor %671, %int0_5668, %int0_5669, %int9223372036854775807_5670, %int1_5671 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_5672 = torch.constant.int 1 %int0_5673 = torch.constant.int 0 %int1_5674 = torch.constant.int 1 %4584 = torch.aten.slice.Tensor %4583, %int1_5672, %int0_5673, %4560, %int1_5674 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int0_5675 = torch.constant.int 0 %int0_5676 = torch.constant.int 0 %int9223372036854775807_5677 = torch.constant.int 9223372036854775807 %int1_5678 = torch.constant.int 1 %4585 = torch.aten.slice.Tensor %673, %int0_5675, %int0_5676, %int9223372036854775807_5677, %int1_5678 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_5679 = torch.constant.int 1 %int0_5680 = torch.constant.int 0 %int1_5681 = torch.constant.int 1 %4586 = torch.aten.slice.Tensor %4585, %int1_5679, %int0_5680, %4560, %int1_5681 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_5682 = torch.constant.int 1 %int2_5683 = torch.constant.int 2 %4587 = torch.aten.transpose.int %4423, %int1_5682, %int2_5683 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,1,100],f32> %int4_5684 = torch.constant.int 4 %int32_5685 = torch.constant.int 32 %int1_5686 = torch.constant.int 1 %int100_5687 = torch.constant.int 100 %4588 = torch.prim.ListConstruct %int4_5684, %int32_5685, %int1_5686, %int100_5687 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_5688 = torch.constant.bool false %4589 = torch.aten.expand %4587, %4588, %false_5688 : !torch.vtensor<[4,32,1,100],f32>, !torch.list, 
!torch.bool -> !torch.vtensor<[4,32,1,100],f32> %int128_5689 = torch.constant.int 128 %int1_5690 = torch.constant.int 1 %int100_5691 = torch.constant.int 100 %4590 = torch.prim.ListConstruct %int128_5689, %int1_5690, %int100_5691 : (!torch.int, !torch.int, !torch.int) -> !torch.list %4591 = torch.aten.view %4589, %4590 : !torch.vtensor<[4,32,1,100],f32>, !torch.list -> !torch.vtensor<[128,1,100],f32> %int0_5692 = torch.constant.int 0 %int0_5693 = torch.constant.int 0 %int9223372036854775807_5694 = torch.constant.int 9223372036854775807 %int1_5695 = torch.constant.int 1 %4592 = torch.aten.slice.Tensor %4565, %int0_5692, %int0_5693, %int9223372036854775807_5694, %int1_5695 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_5696 = torch.constant.int 1 %int0_5697 = torch.constant.int 0 %int1_5698 = torch.constant.int 1 %4593 = torch.aten.slice.Tensor %4592, %int1_5696, %int0_5697, %4560, %int1_5698 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_5699 = torch.constant.int 1 %int2_5700 = torch.constant.int 2 %4594 = torch.aten.transpose.int %4593, %int1_5699, %int2_5700 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int2_5701 = torch.constant.int 2 %int3_5702 = torch.constant.int 3 %4595 = torch.aten.transpose.int %4594, %int2_5701, %int3_5702 : !torch.vtensor<[4,32,?,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int1_5703 = torch.constant.int 1 %4596 = torch.aten.size.int %4584, %int1_5703 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_5704 = torch.constant.int 4 %int32_5705 = torch.constant.int 32 %int100_5706 = torch.constant.int 100 %4597 = torch.prim.ListConstruct %int4_5704, %int32_5705, %int100_5706, %4596 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_5707 = torch.constant.bool false 
%4598 = torch.aten.expand %4595, %4597, %false_5707 : !torch.vtensor<[4,32,100,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,100,?],f32> %int0_5708 = torch.constant.int 0 %4599 = torch.aten.clone %4598, %int0_5708 : !torch.vtensor<[4,32,100,?],f32>, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int128_5709 = torch.constant.int 128 %int100_5710 = torch.constant.int 100 %4600 = torch.prim.ListConstruct %int128_5709, %int100_5710, %4596 : (!torch.int, !torch.int, !torch.int) -> !torch.list %4601 = torch.aten._unsafe_view %4599, %4600 : !torch.vtensor<[4,32,100,?],f32>, !torch.list -> !torch.vtensor<[128,100,?],f32> %4602 = torch.aten.bmm %4591, %4601 : !torch.vtensor<[128,1,100],f32>, !torch.vtensor<[128,100,?],f32> -> !torch.vtensor<[128,1,?],f32> %int4_5711 = torch.constant.int 4 %int32_5712 = torch.constant.int 32 %int1_5713 = torch.constant.int 1 %4603 = torch.prim.ListConstruct %int4_5711, %int32_5712, %int1_5713, %4596 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4604 = torch.aten.view %4602, %4603 : !torch.vtensor<[128,1,?],f32>, !torch.list -> !torch.vtensor<[4,32,1,?],f32> %float1.000000e01_5714 = torch.constant.float 1.000000e+01 %4605 = torch.aten.div.Scalar %4604, %float1.000000e01_5714 : !torch.vtensor<[4,32,1,?],f32>, !torch.float -> !torch.vtensor<[4,32,1,?],f32> %int1_5715 = torch.constant.int 1 %4606 = torch.aten.add.Tensor %4605, %895, %int1_5715 : !torch.vtensor<[4,32,1,?],f32>, !torch.vtensor<[4,1,1,?],f32>, !torch.int -> !torch.vtensor<[4,32,1,?],f32> %int-1_5716 = torch.constant.int -1 %false_5717 = torch.constant.bool false %4607 = torch.aten._softmax %4606, %int-1_5716, %false_5717 : !torch.vtensor<[4,32,1,?],f32>, !torch.int, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int4_5718 = torch.constant.int 4 %int32_5719 = torch.constant.int 32 %int1_5720 = torch.constant.int 1 %4608 = torch.prim.ListConstruct %int4_5718, %int32_5719, %int1_5720, %4596 : (!torch.int, !torch.int, !torch.int, !torch.int) -> 
!torch.list %false_5721 = torch.constant.bool false %4609 = torch.aten.expand %4607, %4608, %false_5721 : !torch.vtensor<[4,32,1,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int128_5722 = torch.constant.int 128 %int1_5723 = torch.constant.int 1 %4610 = torch.prim.ListConstruct %int128_5722, %int1_5723, %4596 : (!torch.int, !torch.int, !torch.int) -> !torch.list %4611 = torch.aten.view %4609, %4610 : !torch.vtensor<[4,32,1,?],f32>, !torch.list -> !torch.vtensor<[128,1,?],f32> %int0_5724 = torch.constant.int 0 %int0_5725 = torch.constant.int 0 %int9223372036854775807_5726 = torch.constant.int 9223372036854775807 %int1_5727 = torch.constant.int 1 %4612 = torch.aten.slice.Tensor %4582, %int0_5724, %int0_5725, %int9223372036854775807_5726, %int1_5727 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_5728 = torch.constant.int 1 %int0_5729 = torch.constant.int 0 %int1_5730 = torch.constant.int 1 %4613 = torch.aten.slice.Tensor %4612, %int1_5728, %int0_5729, %4560, %int1_5730 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_5731 = torch.constant.int 1 %int2_5732 = torch.constant.int 2 %4614 = torch.aten.transpose.int %4613, %int1_5731, %int2_5732 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int1_5733 = torch.constant.int 1 %4615 = torch.aten.size.int %4586, %int1_5733 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_5734 = torch.constant.int 4 %int32_5735 = torch.constant.int 32 %int100_5736 = torch.constant.int 100 %4616 = torch.prim.ListConstruct %int4_5734, %int32_5735, %4615, %int100_5736 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_5737 = torch.constant.bool false %4617 = torch.aten.expand %4614, %4616, %false_5737 : !torch.vtensor<[4,32,?,100],f32>, !torch.list, !torch.bool -> 
!torch.vtensor<[4,32,?,100],f32> %int0_5738 = torch.constant.int 0 %4618 = torch.aten.clone %4617, %int0_5738 : !torch.vtensor<[4,32,?,100],f32>, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int128_5739 = torch.constant.int 128 %int100_5740 = torch.constant.int 100 %4619 = torch.prim.ListConstruct %int128_5739, %4615, %int100_5740 : (!torch.int, !torch.int, !torch.int) -> !torch.list %4620 = torch.aten._unsafe_view %4618, %4619 : !torch.vtensor<[4,32,?,100],f32>, !torch.list -> !torch.vtensor<[128,?,100],f32> %4621 = torch.aten.bmm %4611, %4620 : !torch.vtensor<[128,1,?],f32>, !torch.vtensor<[128,?,100],f32> -> !torch.vtensor<[128,1,100],f32> %int4_5741 = torch.constant.int 4 %int32_5742 = torch.constant.int 32 %int1_5743 = torch.constant.int 1 %int100_5744 = torch.constant.int 100 %4622 = torch.prim.ListConstruct %int4_5741, %int32_5742, %int1_5743, %int100_5744 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4623 = torch.aten.view %4621, %4622 : !torch.vtensor<[128,1,100],f32>, !torch.list -> !torch.vtensor<[4,32,1,100],f32> %int1_5745 = torch.constant.int 1 %int2_5746 = torch.constant.int 2 %4624 = torch.aten.transpose.int %4623, %int1_5745, %int2_5746 : !torch.vtensor<[4,32,1,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,1,32,100],f32> %int4_5747 = torch.constant.int 4 %int1_5748 = torch.constant.int 1 %int-1_5749 = torch.constant.int -1 %4625 = torch.prim.ListConstruct %int4_5747, %int1_5748, %int-1_5749 : (!torch.int, !torch.int, !torch.int) -> !torch.list %4626 = torch.aten.view %4624, %4625 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,3200],f32> %4627 = torch_c.to_builtin_tensor %4626 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_5750 = tensor.cast %4627 : tensor<4x1x3200xf32> to tensor %4628 = torch_c.to_builtin_tensor %132 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %4629 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_5750, %4628) : (tensor, 
tensor<3200x3200xf16>) -> tensor %cast_5751 = tensor.cast %4629 : tensor to tensor<4x1x3200xf32> %4630 = torch_c.from_builtin_tensor %cast_5751 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int1_5752 = torch.constant.int 1 %4631 = torch.aten.add.Tensor %4388, %4630, %int1_5752 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_5753 = torch.constant.int 2 %4632 = torch.aten.pow.Tensor_Scalar %4631, %int2_5753 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_5754 = torch.constant.int -1 %4633 = torch.prim.ListConstruct %int-1_5754 : (!torch.int) -> !torch.list %true_5755 = torch.constant.bool true %none_5756 = torch.constant.none %4634 = torch.aten.mean.dim %4632, %4633, %true_5755, %none_5756 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_5757 = torch.constant.float 9.9999999747524271E-7 %int1_5758 = torch.constant.int 1 %4635 = torch.aten.add.Scalar %4634, %float9.999990e-07_5757, %int1_5758 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %4636 = torch.aten.rsqrt %4635 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %4637 = torch.aten.mul.Tensor %4631, %4636 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %4638 = torch.aten.mul.Tensor %4637, %133 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %4639 = torch_c.to_builtin_tensor %4638 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_5759 = tensor.cast %4639 : tensor<4x1x3200xf32> to tensor %4640 = torch_c.to_builtin_tensor %134 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %4641 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_5759, %4640) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_5760 = tensor.cast %4641 : tensor to tensor<4x1x8640xf32> %4642 
= torch_c.from_builtin_tensor %cast_5760 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %4643 = torch.aten.silu %4642 : !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32> %4644 = torch_c.to_builtin_tensor %4638 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_5761 = tensor.cast %4644 : tensor<4x1x3200xf32> to tensor %4645 = torch_c.to_builtin_tensor %135 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %4646 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_5761, %4645) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_5762 = tensor.cast %4646 : tensor to tensor<4x1x8640xf32> %4647 = torch_c.from_builtin_tensor %cast_5762 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %4648 = torch.aten.mul.Tensor %4643, %4647 : !torch.vtensor<[4,1,8640],f32>, !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32> %4649 = torch_c.to_builtin_tensor %4648 : !torch.vtensor<[4,1,8640],f32> -> tensor<4x1x8640xf32> %cast_5763 = tensor.cast %4649 : tensor<4x1x8640xf32> to tensor %4650 = torch_c.to_builtin_tensor %136 : !torch.vtensor<[3200,8640],f16> -> tensor<3200x8640xf16> %4651 = util.call @sharktank_mmtfp_3d_3200_8640_f32f16f32(%cast_5763, %4650) : (tensor, tensor<3200x8640xf16>) -> tensor %cast_5764 = tensor.cast %4651 : tensor to tensor<4x1x3200xf32> %4652 = torch_c.from_builtin_tensor %cast_5764 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int1_5765 = torch.constant.int 1 %4653 = torch.aten.add.Tensor %4631, %4652, %int1_5765 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_5766 = torch.constant.int 2 %4654 = torch.aten.pow.Tensor_Scalar %4653, %int2_5766 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_5767 = torch.constant.int -1 %4655 = torch.prim.ListConstruct %int-1_5767 : (!torch.int) -> !torch.list %true_5768 = torch.constant.bool true %none_5769 = torch.constant.none %4656 = 
torch.aten.mean.dim %4654, %4655, %true_5768, %none_5769 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_5770 = torch.constant.float 9.9999999747524271E-7 %int1_5771 = torch.constant.int 1 %4657 = torch.aten.add.Scalar %4656, %float9.999990e-07_5770, %int1_5771 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %4658 = torch.aten.rsqrt %4657 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %4659 = torch.aten.mul.Tensor %4653, %4658 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %4660 = torch.aten.mul.Tensor %4659, %137 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %4661 = torch_c.to_builtin_tensor %4660 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_5772 = tensor.cast %4661 : tensor<4x1x3200xf32> to tensor %4662 = torch_c.to_builtin_tensor %138 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %4663 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_5772, %4662) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_5773 = tensor.cast %4663 : tensor to tensor<4x1x3200xf32> %4664 = torch_c.from_builtin_tensor %cast_5773 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %4665 = torch_c.to_builtin_tensor %4660 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_5774 = tensor.cast %4665 : tensor<4x1x3200xf32> to tensor %4666 = torch_c.to_builtin_tensor %139 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %4667 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_5774, %4666) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_5775 = tensor.cast %4667 : tensor to tensor<4x1x3200xf32> %4668 = torch_c.from_builtin_tensor %cast_5775 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %4669 = torch_c.to_builtin_tensor %4660 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_5776 = 
tensor.cast %4669 : tensor<4x1x3200xf32> to tensor %4670 = torch_c.to_builtin_tensor %140 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %4671 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_5776, %4670) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_5777 = tensor.cast %4671 : tensor to tensor<4x1x3200xf32> %4672 = torch_c.from_builtin_tensor %cast_5777 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int4_5778 = torch.constant.int 4 %int1_5779 = torch.constant.int 1 %int32_5780 = torch.constant.int 32 %int100_5781 = torch.constant.int 100 %4673 = torch.prim.ListConstruct %int4_5778, %int1_5779, %int32_5780, %int100_5781 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4674 = torch.aten.view %4664, %4673 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_5782 = torch.constant.int 4 %int1_5783 = torch.constant.int 1 %int32_5784 = torch.constant.int 32 %int100_5785 = torch.constant.int 100 %4675 = torch.prim.ListConstruct %int4_5782, %int1_5783, %int32_5784, %int100_5785 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4676 = torch.aten.view %4668, %4675 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_5786 = torch.constant.int 4 %int1_5787 = torch.constant.int 1 %int32_5788 = torch.constant.int 32 %int100_5789 = torch.constant.int 100 %4677 = torch.prim.ListConstruct %int4_5786, %int1_5787, %int32_5788, %int100_5789 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4678 = torch.aten.view %4672, %4677 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_5790 = torch.constant.int 4 %int1_5791 = torch.constant.int 1 %int32_5792 = torch.constant.int 32 %int-1_5793 = torch.constant.int -1 %int2_5794 = torch.constant.int 2 %4679 = torch.prim.ListConstruct %int4_5790, %int1_5791, %int32_5792, %int-1_5793, %int2_5794 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) 
-> !torch.list %4680 = torch.aten.view %4674, %4679 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %4681 = torch.aten.view_as_complex %4680 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %int4_5795 = torch.constant.int 4 %int1_5796 = torch.constant.int 1 %int32_5797 = torch.constant.int 32 %int-1_5798 = torch.constant.int -1 %int2_5799 = torch.constant.int 2 %4682 = torch.prim.ListConstruct %int4_5795, %int1_5796, %int32_5797, %int-1_5798, %int2_5799 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4683 = torch.aten.view %4676, %4682 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %4684 = torch.aten.view_as_complex %4683 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %4685 = torch.aten.mul.Tensor %4681, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %4686 = torch.aten.view_as_real %4685 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_5800 = torch.constant.int 4 %int1_5801 = torch.constant.int 1 %int32_5802 = torch.constant.int 32 %int100_5803 = torch.constant.int 100 %4687 = torch.prim.ListConstruct %int4_5800, %int1_5801, %int32_5802, %int100_5803 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4688 = torch.aten.view %4686, %4687 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %4689 = torch.aten.mul.Tensor %4684, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %4690 = torch.aten.view_as_real %4689 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_5804 = torch.constant.int 4 %int1_5805 = torch.constant.int 1 %int32_5806 = torch.constant.int 32 %int100_5807 = torch.constant.int 100 %4691 = torch.prim.ListConstruct %int4_5804, %int1_5805, %int32_5806, 
%int100_5807 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4692 = torch.aten.view %4690, %4691 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int1_5808 = torch.constant.int 1 %int1_5809 = torch.constant.int 1 %4693 = torch.aten.add.Scalar %arg2, %int1_5808, %int1_5809 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[4],si64> %int0_5810 = torch.constant.int 0 %int0_5811 = torch.constant.int 0 %4694 = torch.aten.select.int %4693, %int0_5810, %int0_5811 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_5812 = torch.constant.int 0 %int0_5813 = torch.constant.int 0 %4695 = torch.aten.select.int %arg3, %int0_5812, %int0_5813 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_5814 = torch.constant.int 0 %int0_5815 = torch.constant.int 0 %int9223372036854775807_5816 = torch.constant.int 9223372036854775807 %int1_5817 = torch.constant.int 1 %4696 = torch.aten.slice.Tensor %4695, %int0_5814, %int0_5815, %int9223372036854775807_5816, %int1_5817 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_5818 = torch.constant.int 16 %4697 = torch.aten.floor_divide.Scalar %4694, %int16_5818 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_5819 = torch.constant.int 0 %4698 = torch.aten.index_select %4696, %int0_5819, %4697 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_5820 = torch.constant.int 16 %4699 = torch.aten.remainder.Scalar %4694, %int16_5820 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_5821 = torch.constant.none %4700 = torch.aten.clone %478, %none_5821 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_5822 = torch.constant.none %4701 = torch.aten.clone %479, %none_5822 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_5823 = 
torch.constant.int 0 %4702 = torch.aten.unsqueeze %4699, %int0_5823 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_5824 = torch.constant.int 0 %int0_5825 = torch.constant.int 0 %4703 = torch.aten.select.int %4692, %int0_5824, %int0_5825 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_5826 = torch.constant.int 0 %int0_5827 = torch.constant.int 0 %4704 = torch.aten.select.int %4703, %int0_5826, %int0_5827 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %int-1_5828 = torch.constant.int -1 %int26_5829 = torch.constant.int 26 %int2_5830 = torch.constant.int 2 %int16_5831 = torch.constant.int 16 %int32_5832 = torch.constant.int 32 %int100_5833 = torch.constant.int 100 %4705 = torch.prim.ListConstruct %int-1_5828, %int26_5829, %int2_5830, %int16_5831, %int32_5832, %int100_5833 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4706 = torch.aten.view %4540, %4705 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %4707 = torch.prim.ListConstruct %4698, %4700, %4701, %4702 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_5834 = torch.constant.bool false %4708 = torch.aten.index_put %4706, %4707, %4704, %false_5834 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_5835 = torch.constant.int 2662400 %4709 = torch.prim.ListConstruct %731, %int2662400_5835 : (!torch.int, !torch.int) -> !torch.list %4710 = torch.aten.view %4708, %4709 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_5836 = torch.constant.int -1 %int26_5837 = torch.constant.int 26 %int2_5838 = torch.constant.int 2 %int16_5839 = torch.constant.int 16 %int32_5840 = torch.constant.int 32 %int100_5841 
= torch.constant.int 100 %4711 = torch.prim.ListConstruct %int-1_5836, %int26_5837, %int2_5838, %int16_5839, %int32_5840, %int100_5841 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4712 = torch.aten.view %4710, %4711 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_5842 = torch.constant.none %4713 = torch.aten.clone %480, %none_5842 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_5843 = torch.constant.none %4714 = torch.aten.clone %481, %none_5843 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_5844 = torch.constant.int 0 %4715 = torch.aten.unsqueeze %4699, %int0_5844 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_5845 = torch.constant.int 0 %int0_5846 = torch.constant.int 0 %4716 = torch.aten.select.int %4678, %int0_5845, %int0_5846 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_5847 = torch.constant.int 0 %int0_5848 = torch.constant.int 0 %4717 = torch.aten.select.int %4716, %int0_5847, %int0_5848 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %4718 = torch.prim.ListConstruct %4698, %4713, %4714, %4715 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_5849 = torch.constant.bool false %4719 = torch.aten.index_put %4712, %4718, %4717, %false_5849 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_5850 = torch.constant.int 2662400 %4720 = torch.prim.ListConstruct %731, %int2662400_5850 : (!torch.int, !torch.int) -> !torch.list %4721 = torch.aten.view %4719, %4720 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_5851 = torch.constant.int -1 %int26_5852 = torch.constant.int 26 %int2_5853 
= torch.constant.int 2 %int16_5854 = torch.constant.int 16 %int32_5855 = torch.constant.int 32 %int100_5856 = torch.constant.int 100 %4722 = torch.prim.ListConstruct %int-1_5851, %int26_5852, %int2_5853, %int16_5854, %int32_5855, %int100_5856 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4723 = torch.aten.view %4721, %4722 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_5857 = torch.constant.int 0 %int1_5858 = torch.constant.int 1 %4724 = torch.aten.select.int %4693, %int0_5857, %int1_5858 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_5859 = torch.constant.int 0 %int1_5860 = torch.constant.int 1 %4725 = torch.aten.select.int %arg3, %int0_5859, %int1_5860 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_5861 = torch.constant.int 0 %int0_5862 = torch.constant.int 0 %int9223372036854775807_5863 = torch.constant.int 9223372036854775807 %int1_5864 = torch.constant.int 1 %4726 = torch.aten.slice.Tensor %4725, %int0_5861, %int0_5862, %int9223372036854775807_5863, %int1_5864 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_5865 = torch.constant.int 16 %4727 = torch.aten.floor_divide.Scalar %4724, %int16_5865 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_5866 = torch.constant.int 0 %4728 = torch.aten.index_select %4726, %int0_5866, %4727 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_5867 = torch.constant.int 16 %4729 = torch.aten.remainder.Scalar %4724, %int16_5867 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_5868 = torch.constant.none %4730 = torch.aten.clone %482, %none_5868 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_5869 = torch.constant.none %4731 = torch.aten.clone %483, %none_5869 : !torch.vtensor<[1],si64>, 
!torch.none -> !torch.vtensor<[1],si64> %int0_5870 = torch.constant.int 0 %4732 = torch.aten.unsqueeze %4729, %int0_5870 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_5871 = torch.constant.int 0 %int1_5872 = torch.constant.int 1 %4733 = torch.aten.select.int %4692, %int0_5871, %int1_5872 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_5873 = torch.constant.int 0 %int0_5874 = torch.constant.int 0 %4734 = torch.aten.select.int %4733, %int0_5873, %int0_5874 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %4735 = torch.prim.ListConstruct %4728, %4730, %4731, %4732 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_5875 = torch.constant.bool false %4736 = torch.aten.index_put %4723, %4735, %4734, %false_5875 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_5876 = torch.constant.int 2662400 %4737 = torch.prim.ListConstruct %731, %int2662400_5876 : (!torch.int, !torch.int) -> !torch.list %4738 = torch.aten.view %4736, %4737 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_5877 = torch.constant.int -1 %int26_5878 = torch.constant.int 26 %int2_5879 = torch.constant.int 2 %int16_5880 = torch.constant.int 16 %int32_5881 = torch.constant.int 32 %int100_5882 = torch.constant.int 100 %4739 = torch.prim.ListConstruct %int-1_5877, %int26_5878, %int2_5879, %int16_5880, %int32_5881, %int100_5882 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4740 = torch.aten.view %4738, %4739 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_5883 = torch.constant.none %4741 = torch.aten.clone %484, %none_5883 : !torch.vtensor<[1],si64>, !torch.none -> 
!torch.vtensor<[1],si64> %none_5884 = torch.constant.none %4742 = torch.aten.clone %485, %none_5884 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_5885 = torch.constant.int 0 %4743 = torch.aten.unsqueeze %4729, %int0_5885 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_5886 = torch.constant.int 0 %int1_5887 = torch.constant.int 1 %4744 = torch.aten.select.int %4678, %int0_5886, %int1_5887 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_5888 = torch.constant.int 0 %int0_5889 = torch.constant.int 0 %4745 = torch.aten.select.int %4744, %int0_5888, %int0_5889 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %4746 = torch.prim.ListConstruct %4728, %4741, %4742, %4743 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_5890 = torch.constant.bool false %4747 = torch.aten.index_put %4740, %4746, %4745, %false_5890 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_5891 = torch.constant.int 2662400 %4748 = torch.prim.ListConstruct %731, %int2662400_5891 : (!torch.int, !torch.int) -> !torch.list %4749 = torch.aten.view %4747, %4748 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_5892 = torch.constant.int -1 %int26_5893 = torch.constant.int 26 %int2_5894 = torch.constant.int 2 %int16_5895 = torch.constant.int 16 %int32_5896 = torch.constant.int 32 %int100_5897 = torch.constant.int 100 %4750 = torch.prim.ListConstruct %int-1_5892, %int26_5893, %int2_5894, %int16_5895, %int32_5896, %int100_5897 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4751 = torch.aten.view %4749, %4750 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> 
%int0_5898 = torch.constant.int 0 %int2_5899 = torch.constant.int 2 %4752 = torch.aten.select.int %4693, %int0_5898, %int2_5899 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_5900 = torch.constant.int 0 %int2_5901 = torch.constant.int 2 %4753 = torch.aten.select.int %arg3, %int0_5900, %int2_5901 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_5902 = torch.constant.int 0 %int0_5903 = torch.constant.int 0 %int9223372036854775807_5904 = torch.constant.int 9223372036854775807 %int1_5905 = torch.constant.int 1 %4754 = torch.aten.slice.Tensor %4753, %int0_5902, %int0_5903, %int9223372036854775807_5904, %int1_5905 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_5906 = torch.constant.int 16 %4755 = torch.aten.floor_divide.Scalar %4752, %int16_5906 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_5907 = torch.constant.int 0 %4756 = torch.aten.index_select %4754, %int0_5907, %4755 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_5908 = torch.constant.int 16 %4757 = torch.aten.remainder.Scalar %4752, %int16_5908 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_5909 = torch.constant.none %4758 = torch.aten.clone %486, %none_5909 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_5910 = torch.constant.none %4759 = torch.aten.clone %487, %none_5910 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_5911 = torch.constant.int 0 %4760 = torch.aten.unsqueeze %4757, %int0_5911 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_5912 = torch.constant.int 0 %int2_5913 = torch.constant.int 2 %4761 = torch.aten.select.int %4692, %int0_5912, %int2_5913 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_5914 = torch.constant.int 0 %int0_5915 = 
torch.constant.int 0 %4762 = torch.aten.select.int %4761, %int0_5914, %int0_5915 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %4763 = torch.prim.ListConstruct %4756, %4758, %4759, %4760 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_5916 = torch.constant.bool false %4764 = torch.aten.index_put %4751, %4763, %4762, %false_5916 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_5917 = torch.constant.int 2662400 %4765 = torch.prim.ListConstruct %731, %int2662400_5917 : (!torch.int, !torch.int) -> !torch.list %4766 = torch.aten.view %4764, %4765 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_5918 = torch.constant.int -1 %int26_5919 = torch.constant.int 26 %int2_5920 = torch.constant.int 2 %int16_5921 = torch.constant.int 16 %int32_5922 = torch.constant.int 32 %int100_5923 = torch.constant.int 100 %4767 = torch.prim.ListConstruct %int-1_5918, %int26_5919, %int2_5920, %int16_5921, %int32_5922, %int100_5923 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4768 = torch.aten.view %4766, %4767 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_5924 = torch.constant.none %4769 = torch.aten.clone %488, %none_5924 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_5925 = torch.constant.none %4770 = torch.aten.clone %489, %none_5925 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_5926 = torch.constant.int 0 %4771 = torch.aten.unsqueeze %4757, %int0_5926 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_5927 = torch.constant.int 0 %int2_5928 = torch.constant.int 2 %4772 = torch.aten.select.int %4678, %int0_5927, %int2_5928 : 
!torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_5929 = torch.constant.int 0 %int0_5930 = torch.constant.int 0 %4773 = torch.aten.select.int %4772, %int0_5929, %int0_5930 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %4774 = torch.prim.ListConstruct %4756, %4769, %4770, %4771 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_5931 = torch.constant.bool false %4775 = torch.aten.index_put %4768, %4774, %4773, %false_5931 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_5932 = torch.constant.int 2662400 %4776 = torch.prim.ListConstruct %731, %int2662400_5932 : (!torch.int, !torch.int) -> !torch.list %4777 = torch.aten.view %4775, %4776 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_5933 = torch.constant.int -1 %int26_5934 = torch.constant.int 26 %int2_5935 = torch.constant.int 2 %int16_5936 = torch.constant.int 16 %int32_5937 = torch.constant.int 32 %int100_5938 = torch.constant.int 100 %4778 = torch.prim.ListConstruct %int-1_5933, %int26_5934, %int2_5935, %int16_5936, %int32_5937, %int100_5938 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4779 = torch.aten.view %4777, %4778 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_5939 = torch.constant.int 0 %int3_5940 = torch.constant.int 3 %4780 = torch.aten.select.int %4693, %int0_5939, %int3_5940 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_5941 = torch.constant.int 0 %int3_5942 = torch.constant.int 3 %4781 = torch.aten.select.int %arg3, %int0_5941, %int3_5942 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_5943 = torch.constant.int 0 
%int0_5944 = torch.constant.int 0 %int9223372036854775807_5945 = torch.constant.int 9223372036854775807 %int1_5946 = torch.constant.int 1 %4782 = torch.aten.slice.Tensor %4781, %int0_5943, %int0_5944, %int9223372036854775807_5945, %int1_5946 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_5947 = torch.constant.int 16 %4783 = torch.aten.floor_divide.Scalar %4780, %int16_5947 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_5948 = torch.constant.int 0 %4784 = torch.aten.index_select %4782, %int0_5948, %4783 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_5949 = torch.constant.int 16 %4785 = torch.aten.remainder.Scalar %4780, %int16_5949 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_5950 = torch.constant.none %4786 = torch.aten.clone %490, %none_5950 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_5951 = torch.constant.none %4787 = torch.aten.clone %491, %none_5951 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_5952 = torch.constant.int 0 %4788 = torch.aten.unsqueeze %4785, %int0_5952 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_5953 = torch.constant.int 0 %int3_5954 = torch.constant.int 3 %4789 = torch.aten.select.int %4692, %int0_5953, %int3_5954 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_5955 = torch.constant.int 0 %int0_5956 = torch.constant.int 0 %4790 = torch.aten.select.int %4789, %int0_5955, %int0_5956 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %4791 = torch.prim.ListConstruct %4784, %4786, %4787, %4788 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_5957 = torch.constant.bool false %4792 = torch.aten.index_put %4779, %4791, %4790, %false_5957 
: !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_5958 = torch.constant.int 2662400 %4793 = torch.prim.ListConstruct %731, %int2662400_5958 : (!torch.int, !torch.int) -> !torch.list %4794 = torch.aten.view %4792, %4793 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_5959 = torch.constant.int -1 %int26_5960 = torch.constant.int 26 %int2_5961 = torch.constant.int 2 %int16_5962 = torch.constant.int 16 %int32_5963 = torch.constant.int 32 %int100_5964 = torch.constant.int 100 %4795 = torch.prim.ListConstruct %int-1_5959, %int26_5960, %int2_5961, %int16_5962, %int32_5963, %int100_5964 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4796 = torch.aten.view %4794, %4795 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_5965 = torch.constant.none %4797 = torch.aten.clone %492, %none_5965 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_5966 = torch.constant.none %4798 = torch.aten.clone %493, %none_5966 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_5967 = torch.constant.int 0 %4799 = torch.aten.unsqueeze %4785, %int0_5967 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_5968 = torch.constant.int 0 %int3_5969 = torch.constant.int 3 %4800 = torch.aten.select.int %4678, %int0_5968, %int3_5969 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_5970 = torch.constant.int 0 %int0_5971 = torch.constant.int 0 %4801 = torch.aten.select.int %4800, %int0_5970, %int0_5971 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %4802 = torch.prim.ListConstruct %4784, %4797, %4798, %4799 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> 
!torch.list> %false_5972 = torch.constant.bool false %4803 = torch.aten.index_put %4796, %4802, %4801, %false_5972 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_5973 = torch.constant.int 2662400 %4804 = torch.prim.ListConstruct %731, %int2662400_5973 : (!torch.int, !torch.int) -> !torch.list %4805 = torch.aten.view %4803, %4804 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int52_5974 = torch.constant.int 52 %4806 = torch.aten.mul.Scalar %arg3, %int52_5974 : !torch.vtensor<[4,?],si64>, !torch.int -> !torch.vtensor<[4,?],si64> %int30 = torch.constant.int 30 %int1_5975 = torch.constant.int 1 %4807 = torch.aten.add.Scalar %4806, %int30, %int1_5975 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_5976 = torch.constant.int 4 %4808 = torch.aten.mul.int %int4_5976, %655 : !torch.int, !torch.int -> !torch.int %4809 = torch.prim.ListConstruct %4808 : (!torch.int) -> !torch.list %4810 = torch.aten.view %4807, %4809 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int-1_5977 = torch.constant.int -1 %int26_5978 = torch.constant.int 26 %int2_5979 = torch.constant.int 2 %int16_5980 = torch.constant.int 16 %int32_5981 = torch.constant.int 32 %int100_5982 = torch.constant.int 100 %4811 = torch.prim.ListConstruct %int-1_5977, %int26_5978, %int2_5979, %int16_5980, %int32_5981, %int100_5982 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4812 = torch.aten.view %4805, %4811 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int26_5983 = torch.constant.int 26 %4813 = torch.aten.mul.int %731, %int26_5983 : !torch.int, !torch.int -> !torch.int %int2_5984 = torch.constant.int 2 %4814 = torch.aten.mul.int %4813, %int2_5984 : !torch.int, !torch.int -> !torch.int %int16_5985 = torch.constant.int 16 
%int32_5986 = torch.constant.int 32 %int100_5987 = torch.constant.int 100 %4815 = torch.prim.ListConstruct %4814, %int16_5985, %int32_5986, %int100_5987 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4816 = torch.aten.view %4812, %4815 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,16,32,100],f32> %int0_5988 = torch.constant.int 0 %4817 = torch.aten.index_select %4816, %int0_5988, %4810 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_5989 = torch.constant.int 4 %int16_5990 = torch.constant.int 16 %int32_5991 = torch.constant.int 32 %int100_5992 = torch.constant.int 100 %4818 = torch.prim.ListConstruct %int4_5989, %655, %int16_5990, %int32_5991, %int100_5992 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4819 = torch.aten.view %4817, %4818 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_5993 = torch.constant.int 1 %4820 = torch.aten.size.int %4819, %int1_5993 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_5994 = torch.constant.int 16 %4821 = torch.aten.mul.int %4820, %int16_5994 : !torch.int, !torch.int -> !torch.int %int4_5995 = torch.constant.int 4 %int32_5996 = torch.constant.int 32 %int100_5997 = torch.constant.int 100 %4822 = torch.prim.ListConstruct %int4_5995, %4821, %int32_5996, %int100_5997 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4823 = torch.aten.view %4819, %4822 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_5998 = torch.constant.int 0 %int0_5999 = torch.constant.int 0 %int9223372036854775807_6000 = torch.constant.int 9223372036854775807 %int1_6001 = torch.constant.int 1 %4824 = torch.aten.slice.Tensor %4565, %int0_5998, %int0_5999, %int9223372036854775807_6000, %int1_6001 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> 
!torch.vtensor<[4,2048,32,100],f32> %int16_6002 = torch.constant.int 16 %4825 = torch.aten.mul.int %655, %int16_6002 : !torch.int, !torch.int -> !torch.int %int1_6003 = torch.constant.int 1 %int0_6004 = torch.constant.int 0 %int1_6005 = torch.constant.int 1 %4826 = torch.aten.slice.Tensor %4824, %int1_6003, %int0_6004, %4825, %int1_6005 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_6006 = torch.constant.bool false %4827 = torch.aten.copy %4826, %4823, %false_6006 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_6007 = torch.constant.int 0 %int0_6008 = torch.constant.int 0 %int9223372036854775807_6009 = torch.constant.int 9223372036854775807 %int1_6010 = torch.constant.int 1 %4828 = torch.aten.slice.Tensor %4565, %int0_6007, %int0_6008, %int9223372036854775807_6009, %int1_6010 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_6011 = torch.constant.int 1 %int0_6012 = torch.constant.int 0 %int1_6013 = torch.constant.int 1 %4829 = torch.aten.slice_scatter %4828, %4827, %int1_6011, %int0_6012, %4825, %int1_6013 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_6014 = torch.constant.int 0 %int0_6015 = torch.constant.int 0 %int9223372036854775807_6016 = torch.constant.int 9223372036854775807 %int1_6017 = torch.constant.int 1 %4830 = torch.aten.slice_scatter %4565, %4829, %int0_6014, %int0_6015, %int9223372036854775807_6016, %int1_6017 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_6018 = torch.constant.int 1 %int1_6019 = torch.constant.int 1 %4831 = torch.aten.add.Scalar %4807, %int1_6018, %int1_6019 : 
!torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_6020 = torch.constant.int 4 %4832 = torch.aten.mul.int %int4_6020, %655 : !torch.int, !torch.int -> !torch.int %4833 = torch.prim.ListConstruct %4832 : (!torch.int) -> !torch.list %4834 = torch.aten.view %4831, %4833 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int0_6021 = torch.constant.int 0 %4835 = torch.aten.index_select %4816, %int0_6021, %4834 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_6022 = torch.constant.int 4 %int16_6023 = torch.constant.int 16 %int32_6024 = torch.constant.int 32 %int100_6025 = torch.constant.int 100 %4836 = torch.prim.ListConstruct %int4_6022, %655, %int16_6023, %int32_6024, %int100_6025 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4837 = torch.aten.view %4835, %4836 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_6026 = torch.constant.int 1 %4838 = torch.aten.size.int %4837, %int1_6026 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_6027 = torch.constant.int 16 %4839 = torch.aten.mul.int %4838, %int16_6027 : !torch.int, !torch.int -> !torch.int %int4_6028 = torch.constant.int 4 %int32_6029 = torch.constant.int 32 %int100_6030 = torch.constant.int 100 %4840 = torch.prim.ListConstruct %int4_6028, %4839, %int32_6029, %int100_6030 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4841 = torch.aten.view %4837, %4840 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_6031 = torch.constant.int 0 %int0_6032 = torch.constant.int 0 %int9223372036854775807_6033 = torch.constant.int 9223372036854775807 %int1_6034 = torch.constant.int 1 %4842 = torch.aten.slice.Tensor %4582, %int0_6031, %int0_6032, %int9223372036854775807_6033, %int1_6034 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, 
!torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_6035 = torch.constant.int 1 %int0_6036 = torch.constant.int 0 %int1_6037 = torch.constant.int 1 %4843 = torch.aten.slice.Tensor %4842, %int1_6035, %int0_6036, %4825, %int1_6037 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_6038 = torch.constant.bool false %4844 = torch.aten.copy %4843, %4841, %false_6038 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_6039 = torch.constant.int 0 %int0_6040 = torch.constant.int 0 %int9223372036854775807_6041 = torch.constant.int 9223372036854775807 %int1_6042 = torch.constant.int 1 %4845 = torch.aten.slice.Tensor %4582, %int0_6039, %int0_6040, %int9223372036854775807_6041, %int1_6042 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_6043 = torch.constant.int 1 %int0_6044 = torch.constant.int 0 %int1_6045 = torch.constant.int 1 %4846 = torch.aten.slice_scatter %4845, %4844, %int1_6043, %int0_6044, %4825, %int1_6045 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_6046 = torch.constant.int 0 %int0_6047 = torch.constant.int 0 %int9223372036854775807_6048 = torch.constant.int 9223372036854775807 %int1_6049 = torch.constant.int 1 %4847 = torch.aten.slice_scatter %4582, %4846, %int0_6046, %int0_6047, %int9223372036854775807_6048, %int1_6049 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_6050 = torch.constant.int 0 %int0_6051 = torch.constant.int 0 %int9223372036854775807_6052 = torch.constant.int 9223372036854775807 %int1_6053 = torch.constant.int 1 %4848 = torch.aten.slice.Tensor %671, %int0_6050, 
%int0_6051, %int9223372036854775807_6052, %int1_6053 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_6054 = torch.constant.int 1 %int0_6055 = torch.constant.int 0 %int1_6056 = torch.constant.int 1 %4849 = torch.aten.slice.Tensor %4848, %int1_6054, %int0_6055, %4825, %int1_6056 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int0_6057 = torch.constant.int 0 %int0_6058 = torch.constant.int 0 %int9223372036854775807_6059 = torch.constant.int 9223372036854775807 %int1_6060 = torch.constant.int 1 %4850 = torch.aten.slice.Tensor %673, %int0_6057, %int0_6058, %int9223372036854775807_6059, %int1_6060 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_6061 = torch.constant.int 1 %int0_6062 = torch.constant.int 0 %int1_6063 = torch.constant.int 1 %4851 = torch.aten.slice.Tensor %4850, %int1_6061, %int0_6062, %4825, %int1_6063 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_6064 = torch.constant.int 1 %int2_6065 = torch.constant.int 2 %4852 = torch.aten.transpose.int %4688, %int1_6064, %int2_6065 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,1,100],f32> %int4_6066 = torch.constant.int 4 %int32_6067 = torch.constant.int 32 %int1_6068 = torch.constant.int 1 %int100_6069 = torch.constant.int 100 %4853 = torch.prim.ListConstruct %int4_6066, %int32_6067, %int1_6068, %int100_6069 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_6070 = torch.constant.bool false %4854 = torch.aten.expand %4852, %4853, %false_6070 : !torch.vtensor<[4,32,1,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,100],f32> %int128_6071 = torch.constant.int 128 %int1_6072 = torch.constant.int 1 %int100_6073 = torch.constant.int 
100 %4855 = torch.prim.ListConstruct %int128_6071, %int1_6072, %int100_6073 : (!torch.int, !torch.int, !torch.int) -> !torch.list %4856 = torch.aten.view %4854, %4855 : !torch.vtensor<[4,32,1,100],f32>, !torch.list -> !torch.vtensor<[128,1,100],f32> %int0_6074 = torch.constant.int 0 %int0_6075 = torch.constant.int 0 %int9223372036854775807_6076 = torch.constant.int 9223372036854775807 %int1_6077 = torch.constant.int 1 %4857 = torch.aten.slice.Tensor %4830, %int0_6074, %int0_6075, %int9223372036854775807_6076, %int1_6077 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_6078 = torch.constant.int 1 %int0_6079 = torch.constant.int 0 %int1_6080 = torch.constant.int 1 %4858 = torch.aten.slice.Tensor %4857, %int1_6078, %int0_6079, %4825, %int1_6080 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_6081 = torch.constant.int 1 %int2_6082 = torch.constant.int 2 %4859 = torch.aten.transpose.int %4858, %int1_6081, %int2_6082 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int2_6083 = torch.constant.int 2 %int3_6084 = torch.constant.int 3 %4860 = torch.aten.transpose.int %4859, %int2_6083, %int3_6084 : !torch.vtensor<[4,32,?,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int1_6085 = torch.constant.int 1 %4861 = torch.aten.size.int %4849, %int1_6085 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_6086 = torch.constant.int 4 %int32_6087 = torch.constant.int 32 %int100_6088 = torch.constant.int 100 %4862 = torch.prim.ListConstruct %int4_6086, %int32_6087, %int100_6088, %4861 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_6089 = torch.constant.bool false %4863 = torch.aten.expand %4860, %4862, %false_6089 : !torch.vtensor<[4,32,100,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,100,?],f32> 
%int0_6090 = torch.constant.int 0 %4864 = torch.aten.clone %4863, %int0_6090 : !torch.vtensor<[4,32,100,?],f32>, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int128_6091 = torch.constant.int 128 %int100_6092 = torch.constant.int 100 %4865 = torch.prim.ListConstruct %int128_6091, %int100_6092, %4861 : (!torch.int, !torch.int, !torch.int) -> !torch.list %4866 = torch.aten._unsafe_view %4864, %4865 : !torch.vtensor<[4,32,100,?],f32>, !torch.list -> !torch.vtensor<[128,100,?],f32> %4867 = torch.aten.bmm %4856, %4866 : !torch.vtensor<[128,1,100],f32>, !torch.vtensor<[128,100,?],f32> -> !torch.vtensor<[128,1,?],f32> %int4_6093 = torch.constant.int 4 %int32_6094 = torch.constant.int 32 %int1_6095 = torch.constant.int 1 %4868 = torch.prim.ListConstruct %int4_6093, %int32_6094, %int1_6095, %4861 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4869 = torch.aten.view %4867, %4868 : !torch.vtensor<[128,1,?],f32>, !torch.list -> !torch.vtensor<[4,32,1,?],f32> %float1.000000e01_6096 = torch.constant.float 1.000000e+01 %4870 = torch.aten.div.Scalar %4869, %float1.000000e01_6096 : !torch.vtensor<[4,32,1,?],f32>, !torch.float -> !torch.vtensor<[4,32,1,?],f32> %int1_6097 = torch.constant.int 1 %4871 = torch.aten.add.Tensor %4870, %895, %int1_6097 : !torch.vtensor<[4,32,1,?],f32>, !torch.vtensor<[4,1,1,?],f32>, !torch.int -> !torch.vtensor<[4,32,1,?],f32> %int-1_6098 = torch.constant.int -1 %false_6099 = torch.constant.bool false %4872 = torch.aten._softmax %4871, %int-1_6098, %false_6099 : !torch.vtensor<[4,32,1,?],f32>, !torch.int, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int4_6100 = torch.constant.int 4 %int32_6101 = torch.constant.int 32 %int1_6102 = torch.constant.int 1 %4873 = torch.prim.ListConstruct %int4_6100, %int32_6101, %int1_6102, %4861 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_6103 = torch.constant.bool false %4874 = torch.aten.expand %4872, %4873, %false_6103 : !torch.vtensor<[4,32,1,?],f32>, !torch.list, 
!torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int128_6104 = torch.constant.int 128 %int1_6105 = torch.constant.int 1 %4875 = torch.prim.ListConstruct %int128_6104, %int1_6105, %4861 : (!torch.int, !torch.int, !torch.int) -> !torch.list %4876 = torch.aten.view %4874, %4875 : !torch.vtensor<[4,32,1,?],f32>, !torch.list -> !torch.vtensor<[128,1,?],f32> %int0_6106 = torch.constant.int 0 %int0_6107 = torch.constant.int 0 %int9223372036854775807_6108 = torch.constant.int 9223372036854775807 %int1_6109 = torch.constant.int 1 %4877 = torch.aten.slice.Tensor %4847, %int0_6106, %int0_6107, %int9223372036854775807_6108, %int1_6109 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_6110 = torch.constant.int 1 %int0_6111 = torch.constant.int 0 %int1_6112 = torch.constant.int 1 %4878 = torch.aten.slice.Tensor %4877, %int1_6110, %int0_6111, %4825, %int1_6112 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_6113 = torch.constant.int 1 %int2_6114 = torch.constant.int 2 %4879 = torch.aten.transpose.int %4878, %int1_6113, %int2_6114 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int1_6115 = torch.constant.int 1 %4880 = torch.aten.size.int %4851, %int1_6115 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_6116 = torch.constant.int 4 %int32_6117 = torch.constant.int 32 %int100_6118 = torch.constant.int 100 %4881 = torch.prim.ListConstruct %int4_6116, %int32_6117, %4880, %int100_6118 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_6119 = torch.constant.bool false %4882 = torch.aten.expand %4879, %4881, %false_6119 : !torch.vtensor<[4,32,?,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,?,100],f32> %int0_6120 = torch.constant.int 0 %4883 = torch.aten.clone %4882, %int0_6120 : !torch.vtensor<[4,32,?,100],f32>, !torch.int -> 
!torch.vtensor<[4,32,?,100],f32> %int128_6121 = torch.constant.int 128 %int100_6122 = torch.constant.int 100 %4884 = torch.prim.ListConstruct %int128_6121, %4880, %int100_6122 : (!torch.int, !torch.int, !torch.int) -> !torch.list %4885 = torch.aten._unsafe_view %4883, %4884 : !torch.vtensor<[4,32,?,100],f32>, !torch.list -> !torch.vtensor<[128,?,100],f32> %4886 = torch.aten.bmm %4876, %4885 : !torch.vtensor<[128,1,?],f32>, !torch.vtensor<[128,?,100],f32> -> !torch.vtensor<[128,1,100],f32> %int4_6123 = torch.constant.int 4 %int32_6124 = torch.constant.int 32 %int1_6125 = torch.constant.int 1 %int100_6126 = torch.constant.int 100 %4887 = torch.prim.ListConstruct %int4_6123, %int32_6124, %int1_6125, %int100_6126 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4888 = torch.aten.view %4886, %4887 : !torch.vtensor<[128,1,100],f32>, !torch.list -> !torch.vtensor<[4,32,1,100],f32> %int1_6127 = torch.constant.int 1 %int2_6128 = torch.constant.int 2 %4889 = torch.aten.transpose.int %4888, %int1_6127, %int2_6128 : !torch.vtensor<[4,32,1,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,1,32,100],f32> %int4_6129 = torch.constant.int 4 %int1_6130 = torch.constant.int 1 %int-1_6131 = torch.constant.int -1 %4890 = torch.prim.ListConstruct %int4_6129, %int1_6130, %int-1_6131 : (!torch.int, !torch.int, !torch.int) -> !torch.list %4891 = torch.aten.view %4889, %4890 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,3200],f32> %4892 = torch_c.to_builtin_tensor %4891 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_6132 = tensor.cast %4892 : tensor<4x1x3200xf32> to tensor %4893 = torch_c.to_builtin_tensor %141 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %4894 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_6132, %4893) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_6133 = tensor.cast %4894 : tensor to tensor<4x1x3200xf32> %4895 = torch_c.from_builtin_tensor %cast_6133 : tensor<4x1x3200xf32> -> 
!torch.vtensor<[4,1,3200],f32> %int1_6134 = torch.constant.int 1 %4896 = torch.aten.add.Tensor %4653, %4895, %int1_6134 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_6135 = torch.constant.int 2 %4897 = torch.aten.pow.Tensor_Scalar %4896, %int2_6135 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_6136 = torch.constant.int -1 %4898 = torch.prim.ListConstruct %int-1_6136 : (!torch.int) -> !torch.list %true_6137 = torch.constant.bool true %none_6138 = torch.constant.none %4899 = torch.aten.mean.dim %4897, %4898, %true_6137, %none_6138 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_6139 = torch.constant.float 9.9999999747524271E-7 %int1_6140 = torch.constant.int 1 %4900 = torch.aten.add.Scalar %4899, %float9.999990e-07_6139, %int1_6140 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %4901 = torch.aten.rsqrt %4900 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %4902 = torch.aten.mul.Tensor %4896, %4901 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %4903 = torch.aten.mul.Tensor %4902, %142 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %4904 = torch_c.to_builtin_tensor %4903 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_6141 = tensor.cast %4904 : tensor<4x1x3200xf32> to tensor %4905 = torch_c.to_builtin_tensor %143 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %4906 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_6141, %4905) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_6142 = tensor.cast %4906 : tensor to tensor<4x1x8640xf32> %4907 = torch_c.from_builtin_tensor %cast_6142 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %4908 = torch.aten.silu %4907 : !torch.vtensor<[4,1,8640],f32> -> 
!torch.vtensor<[4,1,8640],f32> %4909 = torch_c.to_builtin_tensor %4903 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_6143 = tensor.cast %4909 : tensor<4x1x3200xf32> to tensor %4910 = torch_c.to_builtin_tensor %144 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %4911 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_6143, %4910) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_6144 = tensor.cast %4911 : tensor to tensor<4x1x8640xf32> %4912 = torch_c.from_builtin_tensor %cast_6144 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %4913 = torch.aten.mul.Tensor %4908, %4912 : !torch.vtensor<[4,1,8640],f32>, !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32> %4914 = torch_c.to_builtin_tensor %4913 : !torch.vtensor<[4,1,8640],f32> -> tensor<4x1x8640xf32> %cast_6145 = tensor.cast %4914 : tensor<4x1x8640xf32> to tensor %4915 = torch_c.to_builtin_tensor %145 : !torch.vtensor<[3200,8640],f16> -> tensor<3200x8640xf16> %4916 = util.call @sharktank_mmtfp_3d_3200_8640_f32f16f32(%cast_6145, %4915) : (tensor, tensor<3200x8640xf16>) -> tensor %cast_6146 = tensor.cast %4916 : tensor to tensor<4x1x3200xf32> %4917 = torch_c.from_builtin_tensor %cast_6146 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int1_6147 = torch.constant.int 1 %4918 = torch.aten.add.Tensor %4896, %4917, %int1_6147 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_6148 = torch.constant.int 2 %4919 = torch.aten.pow.Tensor_Scalar %4918, %int2_6148 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_6149 = torch.constant.int -1 %4920 = torch.prim.ListConstruct %int-1_6149 : (!torch.int) -> !torch.list %true_6150 = torch.constant.bool true %none_6151 = torch.constant.none %4921 = torch.aten.mean.dim %4919, %4920, %true_6150, %none_6151 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> 
%float9.999990e-07_6152 = torch.constant.float 9.9999999747524271E-7 %int1_6153 = torch.constant.int 1 %4922 = torch.aten.add.Scalar %4921, %float9.999990e-07_6152, %int1_6153 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %4923 = torch.aten.rsqrt %4922 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %4924 = torch.aten.mul.Tensor %4918, %4923 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %4925 = torch.aten.mul.Tensor %4924, %146 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %4926 = torch_c.to_builtin_tensor %4925 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_6154 = tensor.cast %4926 : tensor<4x1x3200xf32> to tensor %4927 = torch_c.to_builtin_tensor %147 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %4928 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_6154, %4927) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_6155 = tensor.cast %4928 : tensor to tensor<4x1x3200xf32> %4929 = torch_c.from_builtin_tensor %cast_6155 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %4930 = torch_c.to_builtin_tensor %4925 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_6156 = tensor.cast %4930 : tensor<4x1x3200xf32> to tensor %4931 = torch_c.to_builtin_tensor %148 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %4932 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_6156, %4931) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_6157 = tensor.cast %4932 : tensor to tensor<4x1x3200xf32> %4933 = torch_c.from_builtin_tensor %cast_6157 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %4934 = torch_c.to_builtin_tensor %4925 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_6158 = tensor.cast %4934 : tensor<4x1x3200xf32> to tensor %4935 = torch_c.to_builtin_tensor %149 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %4936 = 
util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_6158, %4935) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_6159 = tensor.cast %4936 : tensor to tensor<4x1x3200xf32> %4937 = torch_c.from_builtin_tensor %cast_6159 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int4_6160 = torch.constant.int 4 %int1_6161 = torch.constant.int 1 %int32_6162 = torch.constant.int 32 %int100_6163 = torch.constant.int 100 %4938 = torch.prim.ListConstruct %int4_6160, %int1_6161, %int32_6162, %int100_6163 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4939 = torch.aten.view %4929, %4938 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_6164 = torch.constant.int 4 %int1_6165 = torch.constant.int 1 %int32_6166 = torch.constant.int 32 %int100_6167 = torch.constant.int 100 %4940 = torch.prim.ListConstruct %int4_6164, %int1_6165, %int32_6166, %int100_6167 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4941 = torch.aten.view %4933, %4940 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_6168 = torch.constant.int 4 %int1_6169 = torch.constant.int 1 %int32_6170 = torch.constant.int 32 %int100_6171 = torch.constant.int 100 %4942 = torch.prim.ListConstruct %int4_6168, %int1_6169, %int32_6170, %int100_6171 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4943 = torch.aten.view %4937, %4942 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_6172 = torch.constant.int 4 %int1_6173 = torch.constant.int 1 %int32_6174 = torch.constant.int 32 %int-1_6175 = torch.constant.int -1 %int2_6176 = torch.constant.int 2 %4944 = torch.prim.ListConstruct %int4_6172, %int1_6173, %int32_6174, %int-1_6175, %int2_6176 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4945 = torch.aten.view %4939, %4944 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %4946 = 
torch.aten.view_as_complex %4945 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %int4_6177 = torch.constant.int 4 %int1_6178 = torch.constant.int 1 %int32_6179 = torch.constant.int 32 %int-1_6180 = torch.constant.int -1 %int2_6181 = torch.constant.int 2 %4947 = torch.prim.ListConstruct %int4_6177, %int1_6178, %int32_6179, %int-1_6180, %int2_6181 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4948 = torch.aten.view %4941, %4947 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %4949 = torch.aten.view_as_complex %4948 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %4950 = torch.aten.mul.Tensor %4946, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %4951 = torch.aten.view_as_real %4950 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_6182 = torch.constant.int 4 %int1_6183 = torch.constant.int 1 %int32_6184 = torch.constant.int 32 %int100_6185 = torch.constant.int 100 %4952 = torch.prim.ListConstruct %int4_6182, %int1_6183, %int32_6184, %int100_6185 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4953 = torch.aten.view %4951, %4952 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %4954 = torch.aten.mul.Tensor %4949, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %4955 = torch.aten.view_as_real %4954 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_6186 = torch.constant.int 4 %int1_6187 = torch.constant.int 1 %int32_6188 = torch.constant.int 32 %int100_6189 = torch.constant.int 100 %4956 = torch.prim.ListConstruct %int4_6186, %int1_6187, %int32_6188, %int100_6189 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4957 = torch.aten.view %4955, %4956 : 
!torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int1_6190 = torch.constant.int 1 %int1_6191 = torch.constant.int 1 %4958 = torch.aten.add.Scalar %arg2, %int1_6190, %int1_6191 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[4],si64> %int0_6192 = torch.constant.int 0 %int0_6193 = torch.constant.int 0 %4959 = torch.aten.select.int %4958, %int0_6192, %int0_6193 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_6194 = torch.constant.int 0 %int0_6195 = torch.constant.int 0 %4960 = torch.aten.select.int %arg3, %int0_6194, %int0_6195 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_6196 = torch.constant.int 0 %int0_6197 = torch.constant.int 0 %int9223372036854775807_6198 = torch.constant.int 9223372036854775807 %int1_6199 = torch.constant.int 1 %4961 = torch.aten.slice.Tensor %4960, %int0_6196, %int0_6197, %int9223372036854775807_6198, %int1_6199 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_6200 = torch.constant.int 16 %4962 = torch.aten.floor_divide.Scalar %4959, %int16_6200 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_6201 = torch.constant.int 0 %4963 = torch.aten.index_select %4961, %int0_6201, %4962 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_6202 = torch.constant.int 16 %4964 = torch.aten.remainder.Scalar %4959, %int16_6202 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_6203 = torch.constant.none %4965 = torch.aten.clone %494, %none_6203 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_6204 = torch.constant.none %4966 = torch.aten.clone %495, %none_6204 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_6205 = torch.constant.int 0 %4967 = torch.aten.unsqueeze %4964, %int0_6205 : !torch.vtensor<[],si64>, !torch.int -> 
!torch.vtensor<[1],si64> %int0_6206 = torch.constant.int 0 %int0_6207 = torch.constant.int 0 %4968 = torch.aten.select.int %4957, %int0_6206, %int0_6207 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_6208 = torch.constant.int 0 %int0_6209 = torch.constant.int 0 %4969 = torch.aten.select.int %4968, %int0_6208, %int0_6209 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %int-1_6210 = torch.constant.int -1 %int26_6211 = torch.constant.int 26 %int2_6212 = torch.constant.int 2 %int16_6213 = torch.constant.int 16 %int32_6214 = torch.constant.int 32 %int100_6215 = torch.constant.int 100 %4970 = torch.prim.ListConstruct %int-1_6210, %int26_6211, %int2_6212, %int16_6213, %int32_6214, %int100_6215 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4971 = torch.aten.view %4805, %4970 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %4972 = torch.prim.ListConstruct %4963, %4965, %4966, %4967 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_6216 = torch.constant.bool false %4973 = torch.aten.index_put %4971, %4972, %4969, %false_6216 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_6217 = torch.constant.int 2662400 %4974 = torch.prim.ListConstruct %731, %int2662400_6217 : (!torch.int, !torch.int) -> !torch.list %4975 = torch.aten.view %4973, %4974 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_6218 = torch.constant.int -1 %int26_6219 = torch.constant.int 26 %int2_6220 = torch.constant.int 2 %int16_6221 = torch.constant.int 16 %int32_6222 = torch.constant.int 32 %int100_6223 = torch.constant.int 100 %4976 = torch.prim.ListConstruct %int-1_6218, %int26_6219, %int2_6220, %int16_6221, 
%int32_6222, %int100_6223 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4977 = torch.aten.view %4975, %4976 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_6224 = torch.constant.none %4978 = torch.aten.clone %496, %none_6224 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_6225 = torch.constant.none %4979 = torch.aten.clone %497, %none_6225 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_6226 = torch.constant.int 0 %4980 = torch.aten.unsqueeze %4964, %int0_6226 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_6227 = torch.constant.int 0 %int0_6228 = torch.constant.int 0 %4981 = torch.aten.select.int %4943, %int0_6227, %int0_6228 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_6229 = torch.constant.int 0 %int0_6230 = torch.constant.int 0 %4982 = torch.aten.select.int %4981, %int0_6229, %int0_6230 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %4983 = torch.prim.ListConstruct %4963, %4978, %4979, %4980 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_6231 = torch.constant.bool false %4984 = torch.aten.index_put %4977, %4983, %4982, %false_6231 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_6232 = torch.constant.int 2662400 %4985 = torch.prim.ListConstruct %731, %int2662400_6232 : (!torch.int, !torch.int) -> !torch.list %4986 = torch.aten.view %4984, %4985 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_6233 = torch.constant.int -1 %int26_6234 = torch.constant.int 26 %int2_6235 = torch.constant.int 2 %int16_6236 = torch.constant.int 16 %int32_6237 = torch.constant.int 32 %int100_6238 
= torch.constant.int 100 %4987 = torch.prim.ListConstruct %int-1_6233, %int26_6234, %int2_6235, %int16_6236, %int32_6237, %int100_6238 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %4988 = torch.aten.view %4986, %4987 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_6239 = torch.constant.int 0 %int1_6240 = torch.constant.int 1 %4989 = torch.aten.select.int %4958, %int0_6239, %int1_6240 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_6241 = torch.constant.int 0 %int1_6242 = torch.constant.int 1 %4990 = torch.aten.select.int %arg3, %int0_6241, %int1_6242 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_6243 = torch.constant.int 0 %int0_6244 = torch.constant.int 0 %int9223372036854775807_6245 = torch.constant.int 9223372036854775807 %int1_6246 = torch.constant.int 1 %4991 = torch.aten.slice.Tensor %4990, %int0_6243, %int0_6244, %int9223372036854775807_6245, %int1_6246 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_6247 = torch.constant.int 16 %4992 = torch.aten.floor_divide.Scalar %4989, %int16_6247 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_6248 = torch.constant.int 0 %4993 = torch.aten.index_select %4991, %int0_6248, %4992 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_6249 = torch.constant.int 16 %4994 = torch.aten.remainder.Scalar %4989, %int16_6249 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_6250 = torch.constant.none %4995 = torch.aten.clone %498, %none_6250 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_6251 = torch.constant.none %4996 = torch.aten.clone %499, %none_6251 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_6252 = torch.constant.int 0 %4997 = torch.aten.unsqueeze %4994, 
%int0_6252 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_6253 = torch.constant.int 0 %int1_6254 = torch.constant.int 1 %4998 = torch.aten.select.int %4957, %int0_6253, %int1_6254 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_6255 = torch.constant.int 0 %int0_6256 = torch.constant.int 0 %4999 = torch.aten.select.int %4998, %int0_6255, %int0_6256 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %5000 = torch.prim.ListConstruct %4993, %4995, %4996, %4997 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_6257 = torch.constant.bool false %5001 = torch.aten.index_put %4988, %5000, %4999, %false_6257 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_6258 = torch.constant.int 2662400 %5002 = torch.prim.ListConstruct %731, %int2662400_6258 : (!torch.int, !torch.int) -> !torch.list %5003 = torch.aten.view %5001, %5002 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_6259 = torch.constant.int -1 %int26_6260 = torch.constant.int 26 %int2_6261 = torch.constant.int 2 %int16_6262 = torch.constant.int 16 %int32_6263 = torch.constant.int 32 %int100_6264 = torch.constant.int 100 %5004 = torch.prim.ListConstruct %int-1_6259, %int26_6260, %int2_6261, %int16_6262, %int32_6263, %int100_6264 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5005 = torch.aten.view %5003, %5004 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_6265 = torch.constant.none %5006 = torch.aten.clone %500, %none_6265 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_6266 = torch.constant.none %5007 = torch.aten.clone %501, %none_6266 : !torch.vtensor<[1],si64>, 
!torch.none -> !torch.vtensor<[1],si64> %int0_6267 = torch.constant.int 0 %5008 = torch.aten.unsqueeze %4994, %int0_6267 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_6268 = torch.constant.int 0 %int1_6269 = torch.constant.int 1 %5009 = torch.aten.select.int %4943, %int0_6268, %int1_6269 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_6270 = torch.constant.int 0 %int0_6271 = torch.constant.int 0 %5010 = torch.aten.select.int %5009, %int0_6270, %int0_6271 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %5011 = torch.prim.ListConstruct %4993, %5006, %5007, %5008 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_6272 = torch.constant.bool false %5012 = torch.aten.index_put %5005, %5011, %5010, %false_6272 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_6273 = torch.constant.int 2662400 %5013 = torch.prim.ListConstruct %731, %int2662400_6273 : (!torch.int, !torch.int) -> !torch.list %5014 = torch.aten.view %5012, %5013 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_6274 = torch.constant.int -1 %int26_6275 = torch.constant.int 26 %int2_6276 = torch.constant.int 2 %int16_6277 = torch.constant.int 16 %int32_6278 = torch.constant.int 32 %int100_6279 = torch.constant.int 100 %5015 = torch.prim.ListConstruct %int-1_6274, %int26_6275, %int2_6276, %int16_6277, %int32_6278, %int100_6279 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5016 = torch.aten.view %5014, %5015 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_6280 = torch.constant.int 0 %int2_6281 = torch.constant.int 2 %5017 = torch.aten.select.int %4958, %int0_6280, %int2_6281 : 
!torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_6282 = torch.constant.int 0 %int2_6283 = torch.constant.int 2 %5018 = torch.aten.select.int %arg3, %int0_6282, %int2_6283 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_6284 = torch.constant.int 0 %int0_6285 = torch.constant.int 0 %int9223372036854775807_6286 = torch.constant.int 9223372036854775807 %int1_6287 = torch.constant.int 1 %5019 = torch.aten.slice.Tensor %5018, %int0_6284, %int0_6285, %int9223372036854775807_6286, %int1_6287 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_6288 = torch.constant.int 16 %5020 = torch.aten.floor_divide.Scalar %5017, %int16_6288 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_6289 = torch.constant.int 0 %5021 = torch.aten.index_select %5019, %int0_6289, %5020 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_6290 = torch.constant.int 16 %5022 = torch.aten.remainder.Scalar %5017, %int16_6290 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_6291 = torch.constant.none %5023 = torch.aten.clone %502, %none_6291 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_6292 = torch.constant.none %5024 = torch.aten.clone %503, %none_6292 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_6293 = torch.constant.int 0 %5025 = torch.aten.unsqueeze %5022, %int0_6293 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_6294 = torch.constant.int 0 %int2_6295 = torch.constant.int 2 %5026 = torch.aten.select.int %4957, %int0_6294, %int2_6295 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_6296 = torch.constant.int 0 %int0_6297 = torch.constant.int 0 %5027 = torch.aten.select.int %5026, %int0_6296, %int0_6297 : !torch.vtensor<[1,32,100],f32>, !torch.int, 
!torch.int -> !torch.vtensor<[32,100],f32> %5028 = torch.prim.ListConstruct %5021, %5023, %5024, %5025 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_6298 = torch.constant.bool false %5029 = torch.aten.index_put %5016, %5028, %5027, %false_6298 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_6299 = torch.constant.int 2662400 %5030 = torch.prim.ListConstruct %731, %int2662400_6299 : (!torch.int, !torch.int) -> !torch.list %5031 = torch.aten.view %5029, %5030 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_6300 = torch.constant.int -1 %int26_6301 = torch.constant.int 26 %int2_6302 = torch.constant.int 2 %int16_6303 = torch.constant.int 16 %int32_6304 = torch.constant.int 32 %int100_6305 = torch.constant.int 100 %5032 = torch.prim.ListConstruct %int-1_6300, %int26_6301, %int2_6302, %int16_6303, %int32_6304, %int100_6305 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5033 = torch.aten.view %5031, %5032 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_6306 = torch.constant.none %5034 = torch.aten.clone %504, %none_6306 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_6307 = torch.constant.none %5035 = torch.aten.clone %505, %none_6307 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_6308 = torch.constant.int 0 %5036 = torch.aten.unsqueeze %5022, %int0_6308 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_6309 = torch.constant.int 0 %int2_6310 = torch.constant.int 2 %5037 = torch.aten.select.int %4943, %int0_6309, %int2_6310 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_6311 = torch.constant.int 0 %int0_6312 = torch.constant.int 
0 %5038 = torch.aten.select.int %5037, %int0_6311, %int0_6312 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %5039 = torch.prim.ListConstruct %5021, %5034, %5035, %5036 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_6313 = torch.constant.bool false %5040 = torch.aten.index_put %5033, %5039, %5038, %false_6313 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_6314 = torch.constant.int 2662400 %5041 = torch.prim.ListConstruct %731, %int2662400_6314 : (!torch.int, !torch.int) -> !torch.list %5042 = torch.aten.view %5040, %5041 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_6315 = torch.constant.int -1 %int26_6316 = torch.constant.int 26 %int2_6317 = torch.constant.int 2 %int16_6318 = torch.constant.int 16 %int32_6319 = torch.constant.int 32 %int100_6320 = torch.constant.int 100 %5043 = torch.prim.ListConstruct %int-1_6315, %int26_6316, %int2_6317, %int16_6318, %int32_6319, %int100_6320 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5044 = torch.aten.view %5042, %5043 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_6321 = torch.constant.int 0 %int3_6322 = torch.constant.int 3 %5045 = torch.aten.select.int %4958, %int0_6321, %int3_6322 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_6323 = torch.constant.int 0 %int3_6324 = torch.constant.int 3 %5046 = torch.aten.select.int %arg3, %int0_6323, %int3_6324 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_6325 = torch.constant.int 0 %int0_6326 = torch.constant.int 0 %int9223372036854775807_6327 = torch.constant.int 9223372036854775807 %int1_6328 = torch.constant.int 1 %5047 = 
torch.aten.slice.Tensor %5046, %int0_6325, %int0_6326, %int9223372036854775807_6327, %int1_6328 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_6329 = torch.constant.int 16 %5048 = torch.aten.floor_divide.Scalar %5045, %int16_6329 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_6330 = torch.constant.int 0 %5049 = torch.aten.index_select %5047, %int0_6330, %5048 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_6331 = torch.constant.int 16 %5050 = torch.aten.remainder.Scalar %5045, %int16_6331 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_6332 = torch.constant.none %5051 = torch.aten.clone %506, %none_6332 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_6333 = torch.constant.none %5052 = torch.aten.clone %507, %none_6333 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_6334 = torch.constant.int 0 %5053 = torch.aten.unsqueeze %5050, %int0_6334 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_6335 = torch.constant.int 0 %int3_6336 = torch.constant.int 3 %5054 = torch.aten.select.int %4957, %int0_6335, %int3_6336 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_6337 = torch.constant.int 0 %int0_6338 = torch.constant.int 0 %5055 = torch.aten.select.int %5054, %int0_6337, %int0_6338 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %5056 = torch.prim.ListConstruct %5049, %5051, %5052, %5053 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_6339 = torch.constant.bool false %5057 = torch.aten.index_put %5044, %5056, %5055, %false_6339 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> 
%int2662400_6340 = torch.constant.int 2662400 %5058 = torch.prim.ListConstruct %731, %int2662400_6340 : (!torch.int, !torch.int) -> !torch.list %5059 = torch.aten.view %5057, %5058 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_6341 = torch.constant.int -1 %int26_6342 = torch.constant.int 26 %int2_6343 = torch.constant.int 2 %int16_6344 = torch.constant.int 16 %int32_6345 = torch.constant.int 32 %int100_6346 = torch.constant.int 100 %5060 = torch.prim.ListConstruct %int-1_6341, %int26_6342, %int2_6343, %int16_6344, %int32_6345, %int100_6346 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5061 = torch.aten.view %5059, %5060 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_6347 = torch.constant.none %5062 = torch.aten.clone %508, %none_6347 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_6348 = torch.constant.none %5063 = torch.aten.clone %509, %none_6348 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_6349 = torch.constant.int 0 %5064 = torch.aten.unsqueeze %5050, %int0_6349 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_6350 = torch.constant.int 0 %int3_6351 = torch.constant.int 3 %5065 = torch.aten.select.int %4943, %int0_6350, %int3_6351 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_6352 = torch.constant.int 0 %int0_6353 = torch.constant.int 0 %5066 = torch.aten.select.int %5065, %int0_6352, %int0_6353 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %5067 = torch.prim.ListConstruct %5049, %5062, %5063, %5064 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_6354 = torch.constant.bool false %5068 = torch.aten.index_put %5061, %5067, %5066, %false_6354 : 
!torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_6355 = torch.constant.int 2662400 %5069 = torch.prim.ListConstruct %731, %int2662400_6355 : (!torch.int, !torch.int) -> !torch.list %5070 = torch.aten.view %5068, %5069 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int52_6356 = torch.constant.int 52 %5071 = torch.aten.mul.Scalar %arg3, %int52_6356 : !torch.vtensor<[4,?],si64>, !torch.int -> !torch.vtensor<[4,?],si64> %int32_6357 = torch.constant.int 32 %int1_6358 = torch.constant.int 1 %5072 = torch.aten.add.Scalar %5071, %int32_6357, %int1_6358 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_6359 = torch.constant.int 4 %5073 = torch.aten.mul.int %int4_6359, %655 : !torch.int, !torch.int -> !torch.int %5074 = torch.prim.ListConstruct %5073 : (!torch.int) -> !torch.list %5075 = torch.aten.view %5072, %5074 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int-1_6360 = torch.constant.int -1 %int26_6361 = torch.constant.int 26 %int2_6362 = torch.constant.int 2 %int16_6363 = torch.constant.int 16 %int32_6364 = torch.constant.int 32 %int100_6365 = torch.constant.int 100 %5076 = torch.prim.ListConstruct %int-1_6360, %int26_6361, %int2_6362, %int16_6363, %int32_6364, %int100_6365 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5077 = torch.aten.view %5070, %5076 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int26_6366 = torch.constant.int 26 %5078 = torch.aten.mul.int %731, %int26_6366 : !torch.int, !torch.int -> !torch.int %int2_6367 = torch.constant.int 2 %5079 = torch.aten.mul.int %5078, %int2_6367 : !torch.int, !torch.int -> !torch.int %int16_6368 = torch.constant.int 16 %int32_6369 = torch.constant.int 32 %int100_6370 = torch.constant.int 100 %5080 = torch.prim.ListConstruct 
%5079, %int16_6368, %int32_6369, %int100_6370 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5081 = torch.aten.view %5077, %5080 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,16,32,100],f32> %int0_6371 = torch.constant.int 0 %5082 = torch.aten.index_select %5081, %int0_6371, %5075 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_6372 = torch.constant.int 4 %int16_6373 = torch.constant.int 16 %int32_6374 = torch.constant.int 32 %int100_6375 = torch.constant.int 100 %5083 = torch.prim.ListConstruct %int4_6372, %655, %int16_6373, %int32_6374, %int100_6375 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5084 = torch.aten.view %5082, %5083 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_6376 = torch.constant.int 1 %5085 = torch.aten.size.int %5084, %int1_6376 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_6377 = torch.constant.int 16 %5086 = torch.aten.mul.int %5085, %int16_6377 : !torch.int, !torch.int -> !torch.int %int4_6378 = torch.constant.int 4 %int32_6379 = torch.constant.int 32 %int100_6380 = torch.constant.int 100 %5087 = torch.prim.ListConstruct %int4_6378, %5086, %int32_6379, %int100_6380 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5088 = torch.aten.view %5084, %5087 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_6381 = torch.constant.int 0 %int0_6382 = torch.constant.int 0 %int9223372036854775807_6383 = torch.constant.int 9223372036854775807 %int1_6384 = torch.constant.int 1 %5089 = torch.aten.slice.Tensor %4830, %int0_6381, %int0_6382, %int9223372036854775807_6383, %int1_6384 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int16_6385 = torch.constant.int 16 %5090 = torch.aten.mul.int %655, 
%int16_6385 : !torch.int, !torch.int -> !torch.int %int1_6386 = torch.constant.int 1 %int0_6387 = torch.constant.int 0 %int1_6388 = torch.constant.int 1 %5091 = torch.aten.slice.Tensor %5089, %int1_6386, %int0_6387, %5090, %int1_6388 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_6389 = torch.constant.bool false %5092 = torch.aten.copy %5091, %5088, %false_6389 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_6390 = torch.constant.int 0 %int0_6391 = torch.constant.int 0 %int9223372036854775807_6392 = torch.constant.int 9223372036854775807 %int1_6393 = torch.constant.int 1 %5093 = torch.aten.slice.Tensor %4830, %int0_6390, %int0_6391, %int9223372036854775807_6392, %int1_6393 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_6394 = torch.constant.int 1 %int0_6395 = torch.constant.int 0 %int1_6396 = torch.constant.int 1 %5094 = torch.aten.slice_scatter %5093, %5092, %int1_6394, %int0_6395, %5090, %int1_6396 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_6397 = torch.constant.int 0 %int0_6398 = torch.constant.int 0 %int9223372036854775807_6399 = torch.constant.int 9223372036854775807 %int1_6400 = torch.constant.int 1 %5095 = torch.aten.slice_scatter %4830, %5094, %int0_6397, %int0_6398, %int9223372036854775807_6399, %int1_6400 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_6401 = torch.constant.int 1 %int1_6402 = torch.constant.int 1 %5096 = torch.aten.add.Scalar %5072, %int1_6401, %int1_6402 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_6403 = 
torch.constant.int 4 %5097 = torch.aten.mul.int %int4_6403, %655 : !torch.int, !torch.int -> !torch.int %5098 = torch.prim.ListConstruct %5097 : (!torch.int) -> !torch.list %5099 = torch.aten.view %5096, %5098 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int0_6404 = torch.constant.int 0 %5100 = torch.aten.index_select %5081, %int0_6404, %5099 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_6405 = torch.constant.int 4 %int16_6406 = torch.constant.int 16 %int32_6407 = torch.constant.int 32 %int100_6408 = torch.constant.int 100 %5101 = torch.prim.ListConstruct %int4_6405, %655, %int16_6406, %int32_6407, %int100_6408 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5102 = torch.aten.view %5100, %5101 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_6409 = torch.constant.int 1 %5103 = torch.aten.size.int %5102, %int1_6409 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_6410 = torch.constant.int 16 %5104 = torch.aten.mul.int %5103, %int16_6410 : !torch.int, !torch.int -> !torch.int %int4_6411 = torch.constant.int 4 %int32_6412 = torch.constant.int 32 %int100_6413 = torch.constant.int 100 %5105 = torch.prim.ListConstruct %int4_6411, %5104, %int32_6412, %int100_6413 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5106 = torch.aten.view %5102, %5105 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_6414 = torch.constant.int 0 %int0_6415 = torch.constant.int 0 %int9223372036854775807_6416 = torch.constant.int 9223372036854775807 %int1_6417 = torch.constant.int 1 %5107 = torch.aten.slice.Tensor %4847, %int0_6414, %int0_6415, %int9223372036854775807_6416, %int1_6417 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_6418 = torch.constant.int 1 
%int0_6419 = torch.constant.int 0 %int1_6420 = torch.constant.int 1 %5108 = torch.aten.slice.Tensor %5107, %int1_6418, %int0_6419, %5090, %int1_6420 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_6421 = torch.constant.bool false %5109 = torch.aten.copy %5108, %5106, %false_6421 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_6422 = torch.constant.int 0 %int0_6423 = torch.constant.int 0 %int9223372036854775807_6424 = torch.constant.int 9223372036854775807 %int1_6425 = torch.constant.int 1 %5110 = torch.aten.slice.Tensor %4847, %int0_6422, %int0_6423, %int9223372036854775807_6424, %int1_6425 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_6426 = torch.constant.int 1 %int0_6427 = torch.constant.int 0 %int1_6428 = torch.constant.int 1 %5111 = torch.aten.slice_scatter %5110, %5109, %int1_6426, %int0_6427, %5090, %int1_6428 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_6429 = torch.constant.int 0 %int0_6430 = torch.constant.int 0 %int9223372036854775807_6431 = torch.constant.int 9223372036854775807 %int1_6432 = torch.constant.int 1 %5112 = torch.aten.slice_scatter %4847, %5111, %int0_6429, %int0_6430, %int9223372036854775807_6431, %int1_6432 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_6433 = torch.constant.int 0 %int0_6434 = torch.constant.int 0 %int9223372036854775807_6435 = torch.constant.int 9223372036854775807 %int1_6436 = torch.constant.int 1 %5113 = torch.aten.slice.Tensor %671, %int0_6433, %int0_6434, %int9223372036854775807_6435, %int1_6436 : !torch.vtensor<[4,2048,32,100],f32>, 
!torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_6437 = torch.constant.int 1 %int0_6438 = torch.constant.int 0 %int1_6439 = torch.constant.int 1 %5114 = torch.aten.slice.Tensor %5113, %int1_6437, %int0_6438, %5090, %int1_6439 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int0_6440 = torch.constant.int 0 %int0_6441 = torch.constant.int 0 %int9223372036854775807_6442 = torch.constant.int 9223372036854775807 %int1_6443 = torch.constant.int 1 %5115 = torch.aten.slice.Tensor %673, %int0_6440, %int0_6441, %int9223372036854775807_6442, %int1_6443 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_6444 = torch.constant.int 1 %int0_6445 = torch.constant.int 0 %int1_6446 = torch.constant.int 1 %5116 = torch.aten.slice.Tensor %5115, %int1_6444, %int0_6445, %5090, %int1_6446 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_6447 = torch.constant.int 1 %int2_6448 = torch.constant.int 2 %5117 = torch.aten.transpose.int %4953, %int1_6447, %int2_6448 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,1,100],f32> %int4_6449 = torch.constant.int 4 %int32_6450 = torch.constant.int 32 %int1_6451 = torch.constant.int 1 %int100_6452 = torch.constant.int 100 %5118 = torch.prim.ListConstruct %int4_6449, %int32_6450, %int1_6451, %int100_6452 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_6453 = torch.constant.bool false %5119 = torch.aten.expand %5117, %5118, %false_6453 : !torch.vtensor<[4,32,1,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,100],f32> %int128_6454 = torch.constant.int 128 %int1_6455 = torch.constant.int 1 %int100_6456 = torch.constant.int 100 %5120 = torch.prim.ListConstruct %int128_6454, %int1_6455, %int100_6456 : (!torch.int, 
!torch.int, !torch.int) -> !torch.list %5121 = torch.aten.view %5119, %5120 : !torch.vtensor<[4,32,1,100],f32>, !torch.list -> !torch.vtensor<[128,1,100],f32> %int0_6457 = torch.constant.int 0 %int0_6458 = torch.constant.int 0 %int9223372036854775807_6459 = torch.constant.int 9223372036854775807 %int1_6460 = torch.constant.int 1 %5122 = torch.aten.slice.Tensor %5095, %int0_6457, %int0_6458, %int9223372036854775807_6459, %int1_6460 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_6461 = torch.constant.int 1 %int0_6462 = torch.constant.int 0 %int1_6463 = torch.constant.int 1 %5123 = torch.aten.slice.Tensor %5122, %int1_6461, %int0_6462, %5090, %int1_6463 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_6464 = torch.constant.int 1 %int2_6465 = torch.constant.int 2 %5124 = torch.aten.transpose.int %5123, %int1_6464, %int2_6465 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int2_6466 = torch.constant.int 2 %int3_6467 = torch.constant.int 3 %5125 = torch.aten.transpose.int %5124, %int2_6466, %int3_6467 : !torch.vtensor<[4,32,?,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int1_6468 = torch.constant.int 1 %5126 = torch.aten.size.int %5114, %int1_6468 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_6469 = torch.constant.int 4 %int32_6470 = torch.constant.int 32 %int100_6471 = torch.constant.int 100 %5127 = torch.prim.ListConstruct %int4_6469, %int32_6470, %int100_6471, %5126 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_6472 = torch.constant.bool false %5128 = torch.aten.expand %5125, %5127, %false_6472 : !torch.vtensor<[4,32,100,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,100,?],f32> %int0_6473 = torch.constant.int 0 %5129 = torch.aten.clone %5128, %int0_6473 : 
!torch.vtensor<[4,32,100,?],f32>, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int128_6474 = torch.constant.int 128 %int100_6475 = torch.constant.int 100 %5130 = torch.prim.ListConstruct %int128_6474, %int100_6475, %5126 : (!torch.int, !torch.int, !torch.int) -> !torch.list %5131 = torch.aten._unsafe_view %5129, %5130 : !torch.vtensor<[4,32,100,?],f32>, !torch.list -> !torch.vtensor<[128,100,?],f32> %5132 = torch.aten.bmm %5121, %5131 : !torch.vtensor<[128,1,100],f32>, !torch.vtensor<[128,100,?],f32> -> !torch.vtensor<[128,1,?],f32> %int4_6476 = torch.constant.int 4 %int32_6477 = torch.constant.int 32 %int1_6478 = torch.constant.int 1 %5133 = torch.prim.ListConstruct %int4_6476, %int32_6477, %int1_6478, %5126 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5134 = torch.aten.view %5132, %5133 : !torch.vtensor<[128,1,?],f32>, !torch.list -> !torch.vtensor<[4,32,1,?],f32> %float1.000000e01_6479 = torch.constant.float 1.000000e+01 %5135 = torch.aten.div.Scalar %5134, %float1.000000e01_6479 : !torch.vtensor<[4,32,1,?],f32>, !torch.float -> !torch.vtensor<[4,32,1,?],f32> %int1_6480 = torch.constant.int 1 %5136 = torch.aten.add.Tensor %5135, %895, %int1_6480 : !torch.vtensor<[4,32,1,?],f32>, !torch.vtensor<[4,1,1,?],f32>, !torch.int -> !torch.vtensor<[4,32,1,?],f32> %int-1_6481 = torch.constant.int -1 %false_6482 = torch.constant.bool false %5137 = torch.aten._softmax %5136, %int-1_6481, %false_6482 : !torch.vtensor<[4,32,1,?],f32>, !torch.int, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int4_6483 = torch.constant.int 4 %int32_6484 = torch.constant.int 32 %int1_6485 = torch.constant.int 1 %5138 = torch.prim.ListConstruct %int4_6483, %int32_6484, %int1_6485, %5126 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_6486 = torch.constant.bool false %5139 = torch.aten.expand %5137, %5138, %false_6486 : !torch.vtensor<[4,32,1,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int128_6487 = torch.constant.int 128 
%int1_6488 = torch.constant.int 1 %5140 = torch.prim.ListConstruct %int128_6487, %int1_6488, %5126 : (!torch.int, !torch.int, !torch.int) -> !torch.list %5141 = torch.aten.view %5139, %5140 : !torch.vtensor<[4,32,1,?],f32>, !torch.list -> !torch.vtensor<[128,1,?],f32> %int0_6489 = torch.constant.int 0 %int0_6490 = torch.constant.int 0 %int9223372036854775807_6491 = torch.constant.int 9223372036854775807 %int1_6492 = torch.constant.int 1 %5142 = torch.aten.slice.Tensor %5112, %int0_6489, %int0_6490, %int9223372036854775807_6491, %int1_6492 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_6493 = torch.constant.int 1 %int0_6494 = torch.constant.int 0 %int1_6495 = torch.constant.int 1 %5143 = torch.aten.slice.Tensor %5142, %int1_6493, %int0_6494, %5090, %int1_6495 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_6496 = torch.constant.int 1 %int2_6497 = torch.constant.int 2 %5144 = torch.aten.transpose.int %5143, %int1_6496, %int2_6497 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int1_6498 = torch.constant.int 1 %5145 = torch.aten.size.int %5116, %int1_6498 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_6499 = torch.constant.int 4 %int32_6500 = torch.constant.int 32 %int100_6501 = torch.constant.int 100 %5146 = torch.prim.ListConstruct %int4_6499, %int32_6500, %5145, %int100_6501 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_6502 = torch.constant.bool false %5147 = torch.aten.expand %5144, %5146, %false_6502 : !torch.vtensor<[4,32,?,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,?,100],f32> %int0_6503 = torch.constant.int 0 %5148 = torch.aten.clone %5147, %int0_6503 : !torch.vtensor<[4,32,?,100],f32>, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int128_6504 = torch.constant.int 128 %int100_6505 = 
torch.constant.int 100 %5149 = torch.prim.ListConstruct %int128_6504, %5145, %int100_6505 : (!torch.int, !torch.int, !torch.int) -> !torch.list %5150 = torch.aten._unsafe_view %5148, %5149 : !torch.vtensor<[4,32,?,100],f32>, !torch.list -> !torch.vtensor<[128,?,100],f32> %5151 = torch.aten.bmm %5141, %5150 : !torch.vtensor<[128,1,?],f32>, !torch.vtensor<[128,?,100],f32> -> !torch.vtensor<[128,1,100],f32> %int4_6506 = torch.constant.int 4 %int32_6507 = torch.constant.int 32 %int1_6508 = torch.constant.int 1 %int100_6509 = torch.constant.int 100 %5152 = torch.prim.ListConstruct %int4_6506, %int32_6507, %int1_6508, %int100_6509 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5153 = torch.aten.view %5151, %5152 : !torch.vtensor<[128,1,100],f32>, !torch.list -> !torch.vtensor<[4,32,1,100],f32> %int1_6510 = torch.constant.int 1 %int2_6511 = torch.constant.int 2 %5154 = torch.aten.transpose.int %5153, %int1_6510, %int2_6511 : !torch.vtensor<[4,32,1,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,1,32,100],f32> %int4_6512 = torch.constant.int 4 %int1_6513 = torch.constant.int 1 %int-1_6514 = torch.constant.int -1 %5155 = torch.prim.ListConstruct %int4_6512, %int1_6513, %int-1_6514 : (!torch.int, !torch.int, !torch.int) -> !torch.list %5156 = torch.aten.view %5154, %5155 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,3200],f32> %5157 = torch_c.to_builtin_tensor %5156 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_6515 = tensor.cast %5157 : tensor<4x1x3200xf32> to tensor %5158 = torch_c.to_builtin_tensor %150 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %5159 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_6515, %5158) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_6516 = tensor.cast %5159 : tensor to tensor<4x1x3200xf32> %5160 = torch_c.from_builtin_tensor %cast_6516 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int1_6517 = torch.constant.int 1 %5161 = 
torch.aten.add.Tensor %4918, %5160, %int1_6517 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_6518 = torch.constant.int 2 %5162 = torch.aten.pow.Tensor_Scalar %5161, %int2_6518 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_6519 = torch.constant.int -1 %5163 = torch.prim.ListConstruct %int-1_6519 : (!torch.int) -> !torch.list %true_6520 = torch.constant.bool true %none_6521 = torch.constant.none %5164 = torch.aten.mean.dim %5162, %5163, %true_6520, %none_6521 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_6522 = torch.constant.float 9.9999999747524271E-7 %int1_6523 = torch.constant.int 1 %5165 = torch.aten.add.Scalar %5164, %float9.999990e-07_6522, %int1_6523 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %5166 = torch.aten.rsqrt %5165 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %5167 = torch.aten.mul.Tensor %5161, %5166 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %5168 = torch.aten.mul.Tensor %5167, %151 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %5169 = torch_c.to_builtin_tensor %5168 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_6524 = tensor.cast %5169 : tensor<4x1x3200xf32> to tensor %5170 = torch_c.to_builtin_tensor %152 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %5171 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_6524, %5170) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_6525 = tensor.cast %5171 : tensor to tensor<4x1x8640xf32> %5172 = torch_c.from_builtin_tensor %cast_6525 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %5173 = torch.aten.silu %5172 : !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32> %5174 = torch_c.to_builtin_tensor %5168 : 
!torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_6526 = tensor.cast %5174 : tensor<4x1x3200xf32> to tensor %5175 = torch_c.to_builtin_tensor %153 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %5176 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_6526, %5175) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_6527 = tensor.cast %5176 : tensor to tensor<4x1x8640xf32> %5177 = torch_c.from_builtin_tensor %cast_6527 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %5178 = torch.aten.mul.Tensor %5173, %5177 : !torch.vtensor<[4,1,8640],f32>, !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32> %5179 = torch_c.to_builtin_tensor %5178 : !torch.vtensor<[4,1,8640],f32> -> tensor<4x1x8640xf32> %cast_6528 = tensor.cast %5179 : tensor<4x1x8640xf32> to tensor %5180 = torch_c.to_builtin_tensor %154 : !torch.vtensor<[3200,8640],f16> -> tensor<3200x8640xf16> %5181 = util.call @sharktank_mmtfp_3d_3200_8640_f32f16f32(%cast_6528, %5180) : (tensor, tensor<3200x8640xf16>) -> tensor %cast_6529 = tensor.cast %5181 : tensor to tensor<4x1x3200xf32> %5182 = torch_c.from_builtin_tensor %cast_6529 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int1_6530 = torch.constant.int 1 %5183 = torch.aten.add.Tensor %5161, %5182, %int1_6530 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_6531 = torch.constant.int 2 %5184 = torch.aten.pow.Tensor_Scalar %5183, %int2_6531 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_6532 = torch.constant.int -1 %5185 = torch.prim.ListConstruct %int-1_6532 : (!torch.int) -> !torch.list %true_6533 = torch.constant.bool true %none_6534 = torch.constant.none %5186 = torch.aten.mean.dim %5184, %5185, %true_6533, %none_6534 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_6535 = torch.constant.float 9.9999999747524271E-7 %int1_6536 = 
torch.constant.int 1 %5187 = torch.aten.add.Scalar %5186, %float9.999990e-07_6535, %int1_6536 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %5188 = torch.aten.rsqrt %5187 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %5189 = torch.aten.mul.Tensor %5183, %5188 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %5190 = torch.aten.mul.Tensor %5189, %155 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %5191 = torch_c.to_builtin_tensor %5190 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_6537 = tensor.cast %5191 : tensor<4x1x3200xf32> to tensor %5192 = torch_c.to_builtin_tensor %156 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %5193 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_6537, %5192) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_6538 = tensor.cast %5193 : tensor to tensor<4x1x3200xf32> %5194 = torch_c.from_builtin_tensor %cast_6538 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %5195 = torch_c.to_builtin_tensor %5190 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_6539 = tensor.cast %5195 : tensor<4x1x3200xf32> to tensor %5196 = torch_c.to_builtin_tensor %157 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %5197 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_6539, %5196) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_6540 = tensor.cast %5197 : tensor to tensor<4x1x3200xf32> %5198 = torch_c.from_builtin_tensor %cast_6540 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %5199 = torch_c.to_builtin_tensor %5190 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_6541 = tensor.cast %5199 : tensor<4x1x3200xf32> to tensor %5200 = torch_c.to_builtin_tensor %158 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %5201 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_6541, %5200) : (tensor, 
tensor<3200x3200xf16>) -> tensor %cast_6542 = tensor.cast %5201 : tensor to tensor<4x1x3200xf32> %5202 = torch_c.from_builtin_tensor %cast_6542 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int4_6543 = torch.constant.int 4 %int1_6544 = torch.constant.int 1 %int32_6545 = torch.constant.int 32 %int100_6546 = torch.constant.int 100 %5203 = torch.prim.ListConstruct %int4_6543, %int1_6544, %int32_6545, %int100_6546 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5204 = torch.aten.view %5194, %5203 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_6547 = torch.constant.int 4 %int1_6548 = torch.constant.int 1 %int32_6549 = torch.constant.int 32 %int100_6550 = torch.constant.int 100 %5205 = torch.prim.ListConstruct %int4_6547, %int1_6548, %int32_6549, %int100_6550 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5206 = torch.aten.view %5198, %5205 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_6551 = torch.constant.int 4 %int1_6552 = torch.constant.int 1 %int32_6553 = torch.constant.int 32 %int100_6554 = torch.constant.int 100 %5207 = torch.prim.ListConstruct %int4_6551, %int1_6552, %int32_6553, %int100_6554 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5208 = torch.aten.view %5202, %5207 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_6555 = torch.constant.int 4 %int1_6556 = torch.constant.int 1 %int32_6557 = torch.constant.int 32 %int-1_6558 = torch.constant.int -1 %int2_6559 = torch.constant.int 2 %5209 = torch.prim.ListConstruct %int4_6555, %int1_6556, %int32_6557, %int-1_6558, %int2_6559 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5210 = torch.aten.view %5204, %5209 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %5211 = torch.aten.view_as_complex %5210 : !torch.vtensor<[4,1,32,50,2],f32> -> 
!torch.vtensor<[4,1,32,50],complex> %int4_6560 = torch.constant.int 4 %int1_6561 = torch.constant.int 1 %int32_6562 = torch.constant.int 32 %int-1_6563 = torch.constant.int -1 %int2_6564 = torch.constant.int 2 %5212 = torch.prim.ListConstruct %int4_6560, %int1_6561, %int32_6562, %int-1_6563, %int2_6564 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5213 = torch.aten.view %5206, %5212 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %5214 = torch.aten.view_as_complex %5213 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %5215 = torch.aten.mul.Tensor %5211, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %5216 = torch.aten.view_as_real %5215 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_6565 = torch.constant.int 4 %int1_6566 = torch.constant.int 1 %int32_6567 = torch.constant.int 32 %int100_6568 = torch.constant.int 100 %5217 = torch.prim.ListConstruct %int4_6565, %int1_6566, %int32_6567, %int100_6568 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5218 = torch.aten.view %5216, %5217 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %5219 = torch.aten.mul.Tensor %5214, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %5220 = torch.aten.view_as_real %5219 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_6569 = torch.constant.int 4 %int1_6570 = torch.constant.int 1 %int32_6571 = torch.constant.int 32 %int100_6572 = torch.constant.int 100 %5221 = torch.prim.ListConstruct %int4_6569, %int1_6570, %int32_6571, %int100_6572 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5222 = torch.aten.view %5220, %5221 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int1_6573 = 
torch.constant.int 1 %int1_6574 = torch.constant.int 1 %5223 = torch.aten.add.Scalar %arg2, %int1_6573, %int1_6574 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[4],si64> %int0_6575 = torch.constant.int 0 %int0_6576 = torch.constant.int 0 %5224 = torch.aten.select.int %5223, %int0_6575, %int0_6576 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_6577 = torch.constant.int 0 %int0_6578 = torch.constant.int 0 %5225 = torch.aten.select.int %arg3, %int0_6577, %int0_6578 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_6579 = torch.constant.int 0 %int0_6580 = torch.constant.int 0 %int9223372036854775807_6581 = torch.constant.int 9223372036854775807 %int1_6582 = torch.constant.int 1 %5226 = torch.aten.slice.Tensor %5225, %int0_6579, %int0_6580, %int9223372036854775807_6581, %int1_6582 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_6583 = torch.constant.int 16 %5227 = torch.aten.floor_divide.Scalar %5224, %int16_6583 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_6584 = torch.constant.int 0 %5228 = torch.aten.index_select %5226, %int0_6584, %5227 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_6585 = torch.constant.int 16 %5229 = torch.aten.remainder.Scalar %5224, %int16_6585 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_6586 = torch.constant.none %5230 = torch.aten.clone %510, %none_6586 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_6587 = torch.constant.none %5231 = torch.aten.clone %511, %none_6587 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_6588 = torch.constant.int 0 %5232 = torch.aten.unsqueeze %5229, %int0_6588 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_6589 = torch.constant.int 0 %int0_6590 = torch.constant.int 0 %5233 = 
torch.aten.select.int %5222, %int0_6589, %int0_6590 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_6591 = torch.constant.int 0 %int0_6592 = torch.constant.int 0 %5234 = torch.aten.select.int %5233, %int0_6591, %int0_6592 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %int-1_6593 = torch.constant.int -1 %int26_6594 = torch.constant.int 26 %int2_6595 = torch.constant.int 2 %int16_6596 = torch.constant.int 16 %int32_6597 = torch.constant.int 32 %int100_6598 = torch.constant.int 100 %5235 = torch.prim.ListConstruct %int-1_6593, %int26_6594, %int2_6595, %int16_6596, %int32_6597, %int100_6598 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5236 = torch.aten.view %5070, %5235 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %5237 = torch.prim.ListConstruct %5228, %5230, %5231, %5232 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_6599 = torch.constant.bool false %5238 = torch.aten.index_put %5236, %5237, %5234, %false_6599 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_6600 = torch.constant.int 2662400 %5239 = torch.prim.ListConstruct %731, %int2662400_6600 : (!torch.int, !torch.int) -> !torch.list %5240 = torch.aten.view %5238, %5239 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_6601 = torch.constant.int -1 %int26_6602 = torch.constant.int 26 %int2_6603 = torch.constant.int 2 %int16_6604 = torch.constant.int 16 %int32_6605 = torch.constant.int 32 %int100_6606 = torch.constant.int 100 %5241 = torch.prim.ListConstruct %int-1_6601, %int26_6602, %int2_6603, %int16_6604, %int32_6605, %int100_6606 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) 
-> !torch.list %5242 = torch.aten.view %5240, %5241 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_6607 = torch.constant.none %5243 = torch.aten.clone %512, %none_6607 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_6608 = torch.constant.none %5244 = torch.aten.clone %513, %none_6608 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_6609 = torch.constant.int 0 %5245 = torch.aten.unsqueeze %5229, %int0_6609 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_6610 = torch.constant.int 0 %int0_6611 = torch.constant.int 0 %5246 = torch.aten.select.int %5208, %int0_6610, %int0_6611 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_6612 = torch.constant.int 0 %int0_6613 = torch.constant.int 0 %5247 = torch.aten.select.int %5246, %int0_6612, %int0_6613 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %5248 = torch.prim.ListConstruct %5228, %5243, %5244, %5245 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_6614 = torch.constant.bool false %5249 = torch.aten.index_put %5242, %5248, %5247, %false_6614 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_6615 = torch.constant.int 2662400 %5250 = torch.prim.ListConstruct %731, %int2662400_6615 : (!torch.int, !torch.int) -> !torch.list %5251 = torch.aten.view %5249, %5250 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_6616 = torch.constant.int -1 %int26_6617 = torch.constant.int 26 %int2_6618 = torch.constant.int 2 %int16_6619 = torch.constant.int 16 %int32_6620 = torch.constant.int 32 %int100_6621 = torch.constant.int 100 %5252 = torch.prim.ListConstruct %int-1_6616, %int26_6617, %int2_6618, 
%int16_6619, %int32_6620, %int100_6621 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5253 = torch.aten.view %5251, %5252 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_6622 = torch.constant.int 0 %int1_6623 = torch.constant.int 1 %5254 = torch.aten.select.int %5223, %int0_6622, %int1_6623 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_6624 = torch.constant.int 0 %int1_6625 = torch.constant.int 1 %5255 = torch.aten.select.int %arg3, %int0_6624, %int1_6625 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_6626 = torch.constant.int 0 %int0_6627 = torch.constant.int 0 %int9223372036854775807_6628 = torch.constant.int 9223372036854775807 %int1_6629 = torch.constant.int 1 %5256 = torch.aten.slice.Tensor %5255, %int0_6626, %int0_6627, %int9223372036854775807_6628, %int1_6629 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_6630 = torch.constant.int 16 %5257 = torch.aten.floor_divide.Scalar %5254, %int16_6630 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_6631 = torch.constant.int 0 %5258 = torch.aten.index_select %5256, %int0_6631, %5257 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_6632 = torch.constant.int 16 %5259 = torch.aten.remainder.Scalar %5254, %int16_6632 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_6633 = torch.constant.none %5260 = torch.aten.clone %514, %none_6633 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_6634 = torch.constant.none %5261 = torch.aten.clone %515, %none_6634 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_6635 = torch.constant.int 0 %5262 = torch.aten.unsqueeze %5259, %int0_6635 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_6636 = 
torch.constant.int 0 %int1_6637 = torch.constant.int 1 %5263 = torch.aten.select.int %5222, %int0_6636, %int1_6637 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_6638 = torch.constant.int 0 %int0_6639 = torch.constant.int 0 %5264 = torch.aten.select.int %5263, %int0_6638, %int0_6639 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %5265 = torch.prim.ListConstruct %5258, %5260, %5261, %5262 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_6640 = torch.constant.bool false %5266 = torch.aten.index_put %5253, %5265, %5264, %false_6640 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_6641 = torch.constant.int 2662400 %5267 = torch.prim.ListConstruct %731, %int2662400_6641 : (!torch.int, !torch.int) -> !torch.list %5268 = torch.aten.view %5266, %5267 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_6642 = torch.constant.int -1 %int26_6643 = torch.constant.int 26 %int2_6644 = torch.constant.int 2 %int16_6645 = torch.constant.int 16 %int32_6646 = torch.constant.int 32 %int100_6647 = torch.constant.int 100 %5269 = torch.prim.ListConstruct %int-1_6642, %int26_6643, %int2_6644, %int16_6645, %int32_6646, %int100_6647 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5270 = torch.aten.view %5268, %5269 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_6648 = torch.constant.none %5271 = torch.aten.clone %516, %none_6648 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_6649 = torch.constant.none %5272 = torch.aten.clone %517, %none_6649 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_6650 = torch.constant.int 0 %5273 = 
torch.aten.unsqueeze %5259, %int0_6650 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_6651 = torch.constant.int 0 %int1_6652 = torch.constant.int 1 %5274 = torch.aten.select.int %5208, %int0_6651, %int1_6652 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_6653 = torch.constant.int 0 %int0_6654 = torch.constant.int 0 %5275 = torch.aten.select.int %5274, %int0_6653, %int0_6654 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %5276 = torch.prim.ListConstruct %5258, %5271, %5272, %5273 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_6655 = torch.constant.bool false %5277 = torch.aten.index_put %5270, %5276, %5275, %false_6655 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_6656 = torch.constant.int 2662400 %5278 = torch.prim.ListConstruct %731, %int2662400_6656 : (!torch.int, !torch.int) -> !torch.list %5279 = torch.aten.view %5277, %5278 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_6657 = torch.constant.int -1 %int26_6658 = torch.constant.int 26 %int2_6659 = torch.constant.int 2 %int16_6660 = torch.constant.int 16 %int32_6661 = torch.constant.int 32 %int100_6662 = torch.constant.int 100 %5280 = torch.prim.ListConstruct %int-1_6657, %int26_6658, %int2_6659, %int16_6660, %int32_6661, %int100_6662 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5281 = torch.aten.view %5279, %5280 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_6663 = torch.constant.int 0 %int2_6664 = torch.constant.int 2 %5282 = torch.aten.select.int %5223, %int0_6663, %int2_6664 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_6665 = 
torch.constant.int 0 %int2_6666 = torch.constant.int 2 %5283 = torch.aten.select.int %arg3, %int0_6665, %int2_6666 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_6667 = torch.constant.int 0 %int0_6668 = torch.constant.int 0 %int9223372036854775807_6669 = torch.constant.int 9223372036854775807 %int1_6670 = torch.constant.int 1 %5284 = torch.aten.slice.Tensor %5283, %int0_6667, %int0_6668, %int9223372036854775807_6669, %int1_6670 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_6671 = torch.constant.int 16 %5285 = torch.aten.floor_divide.Scalar %5282, %int16_6671 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_6672 = torch.constant.int 0 %5286 = torch.aten.index_select %5284, %int0_6672, %5285 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_6673 = torch.constant.int 16 %5287 = torch.aten.remainder.Scalar %5282, %int16_6673 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_6674 = torch.constant.none %5288 = torch.aten.clone %518, %none_6674 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_6675 = torch.constant.none %5289 = torch.aten.clone %519, %none_6675 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_6676 = torch.constant.int 0 %5290 = torch.aten.unsqueeze %5287, %int0_6676 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_6677 = torch.constant.int 0 %int2_6678 = torch.constant.int 2 %5291 = torch.aten.select.int %5222, %int0_6677, %int2_6678 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_6679 = torch.constant.int 0 %int0_6680 = torch.constant.int 0 %5292 = torch.aten.select.int %5291, %int0_6679, %int0_6680 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %5293 = torch.prim.ListConstruct %5286, %5288, %5289, 
%5290 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_6681 = torch.constant.bool false %5294 = torch.aten.index_put %5281, %5293, %5292, %false_6681 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_6682 = torch.constant.int 2662400 %5295 = torch.prim.ListConstruct %731, %int2662400_6682 : (!torch.int, !torch.int) -> !torch.list %5296 = torch.aten.view %5294, %5295 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_6683 = torch.constant.int -1 %int26_6684 = torch.constant.int 26 %int2_6685 = torch.constant.int 2 %int16_6686 = torch.constant.int 16 %int32_6687 = torch.constant.int 32 %int100_6688 = torch.constant.int 100 %5297 = torch.prim.ListConstruct %int-1_6683, %int26_6684, %int2_6685, %int16_6686, %int32_6687, %int100_6688 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5298 = torch.aten.view %5296, %5297 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_6689 = torch.constant.none %5299 = torch.aten.clone %520, %none_6689 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_6690 = torch.constant.none %5300 = torch.aten.clone %521, %none_6690 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_6691 = torch.constant.int 0 %5301 = torch.aten.unsqueeze %5287, %int0_6691 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_6692 = torch.constant.int 0 %int2_6693 = torch.constant.int 2 %5302 = torch.aten.select.int %5208, %int0_6692, %int2_6693 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_6694 = torch.constant.int 0 %int0_6695 = torch.constant.int 0 %5303 = torch.aten.select.int %5302, %int0_6694, %int0_6695 : !torch.vtensor<[1,32,100],f32>, 
!torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %5304 = torch.prim.ListConstruct %5286, %5299, %5300, %5301 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_6696 = torch.constant.bool false %5305 = torch.aten.index_put %5298, %5304, %5303, %false_6696 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_6697 = torch.constant.int 2662400 %5306 = torch.prim.ListConstruct %731, %int2662400_6697 : (!torch.int, !torch.int) -> !torch.list %5307 = torch.aten.view %5305, %5306 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_6698 = torch.constant.int -1 %int26_6699 = torch.constant.int 26 %int2_6700 = torch.constant.int 2 %int16_6701 = torch.constant.int 16 %int32_6702 = torch.constant.int 32 %int100_6703 = torch.constant.int 100 %5308 = torch.prim.ListConstruct %int-1_6698, %int26_6699, %int2_6700, %int16_6701, %int32_6702, %int100_6703 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5309 = torch.aten.view %5307, %5308 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_6704 = torch.constant.int 0 %int3_6705 = torch.constant.int 3 %5310 = torch.aten.select.int %5223, %int0_6704, %int3_6705 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_6706 = torch.constant.int 0 %int3_6707 = torch.constant.int 3 %5311 = torch.aten.select.int %arg3, %int0_6706, %int3_6707 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_6708 = torch.constant.int 0 %int0_6709 = torch.constant.int 0 %int9223372036854775807_6710 = torch.constant.int 9223372036854775807 %int1_6711 = torch.constant.int 1 %5312 = torch.aten.slice.Tensor %5311, %int0_6708, %int0_6709, %int9223372036854775807_6710, %int1_6711 : 
!torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_6712 = torch.constant.int 16 %5313 = torch.aten.floor_divide.Scalar %5310, %int16_6712 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_6713 = torch.constant.int 0 %5314 = torch.aten.index_select %5312, %int0_6713, %5313 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_6714 = torch.constant.int 16 %5315 = torch.aten.remainder.Scalar %5310, %int16_6714 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_6715 = torch.constant.none %5316 = torch.aten.clone %522, %none_6715 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_6716 = torch.constant.none %5317 = torch.aten.clone %523, %none_6716 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_6717 = torch.constant.int 0 %5318 = torch.aten.unsqueeze %5315, %int0_6717 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_6718 = torch.constant.int 0 %int3_6719 = torch.constant.int 3 %5319 = torch.aten.select.int %5222, %int0_6718, %int3_6719 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_6720 = torch.constant.int 0 %int0_6721 = torch.constant.int 0 %5320 = torch.aten.select.int %5319, %int0_6720, %int0_6721 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %5321 = torch.prim.ListConstruct %5314, %5316, %5317, %5318 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_6722 = torch.constant.bool false %5322 = torch.aten.index_put %5309, %5321, %5320, %false_6722 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_6723 = torch.constant.int 2662400 %5323 = torch.prim.ListConstruct %731, %int2662400_6723 : 
(!torch.int, !torch.int) -> !torch.list %5324 = torch.aten.view %5322, %5323 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_6724 = torch.constant.int -1 %int26_6725 = torch.constant.int 26 %int2_6726 = torch.constant.int 2 %int16_6727 = torch.constant.int 16 %int32_6728 = torch.constant.int 32 %int100_6729 = torch.constant.int 100 %5325 = torch.prim.ListConstruct %int-1_6724, %int26_6725, %int2_6726, %int16_6727, %int32_6728, %int100_6729 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5326 = torch.aten.view %5324, %5325 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_6730 = torch.constant.none %5327 = torch.aten.clone %524, %none_6730 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_6731 = torch.constant.none %5328 = torch.aten.clone %525, %none_6731 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_6732 = torch.constant.int 0 %5329 = torch.aten.unsqueeze %5315, %int0_6732 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_6733 = torch.constant.int 0 %int3_6734 = torch.constant.int 3 %5330 = torch.aten.select.int %5208, %int0_6733, %int3_6734 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_6735 = torch.constant.int 0 %int0_6736 = torch.constant.int 0 %5331 = torch.aten.select.int %5330, %int0_6735, %int0_6736 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %5332 = torch.prim.ListConstruct %5314, %5327, %5328, %5329 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_6737 = torch.constant.bool false %5333 = torch.aten.index_put %5326, %5332, %5331, %false_6737 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> 
!torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_6738 = torch.constant.int 2662400 %5334 = torch.prim.ListConstruct %731, %int2662400_6738 : (!torch.int, !torch.int) -> !torch.list %5335 = torch.aten.view %5333, %5334 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int52_6739 = torch.constant.int 52 %5336 = torch.aten.mul.Scalar %arg3, %int52_6739 : !torch.vtensor<[4,?],si64>, !torch.int -> !torch.vtensor<[4,?],si64> %int34 = torch.constant.int 34 %int1_6740 = torch.constant.int 1 %5337 = torch.aten.add.Scalar %5336, %int34, %int1_6740 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_6741 = torch.constant.int 4 %5338 = torch.aten.mul.int %int4_6741, %655 : !torch.int, !torch.int -> !torch.int %5339 = torch.prim.ListConstruct %5338 : (!torch.int) -> !torch.list %5340 = torch.aten.view %5337, %5339 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int-1_6742 = torch.constant.int -1 %int26_6743 = torch.constant.int 26 %int2_6744 = torch.constant.int 2 %int16_6745 = torch.constant.int 16 %int32_6746 = torch.constant.int 32 %int100_6747 = torch.constant.int 100 %5341 = torch.prim.ListConstruct %int-1_6742, %int26_6743, %int2_6744, %int16_6745, %int32_6746, %int100_6747 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5342 = torch.aten.view %5335, %5341 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int26_6748 = torch.constant.int 26 %5343 = torch.aten.mul.int %731, %int26_6748 : !torch.int, !torch.int -> !torch.int %int2_6749 = torch.constant.int 2 %5344 = torch.aten.mul.int %5343, %int2_6749 : !torch.int, !torch.int -> !torch.int %int16_6750 = torch.constant.int 16 %int32_6751 = torch.constant.int 32 %int100_6752 = torch.constant.int 100 %5345 = torch.prim.ListConstruct %5344, %int16_6750, %int32_6751, %int100_6752 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list 
%5346 = torch.aten.view %5342, %5345 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,16,32,100],f32> %int0_6753 = torch.constant.int 0 %5347 = torch.aten.index_select %5346, %int0_6753, %5340 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_6754 = torch.constant.int 4 %int16_6755 = torch.constant.int 16 %int32_6756 = torch.constant.int 32 %int100_6757 = torch.constant.int 100 %5348 = torch.prim.ListConstruct %int4_6754, %655, %int16_6755, %int32_6756, %int100_6757 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5349 = torch.aten.view %5347, %5348 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_6758 = torch.constant.int 1 %5350 = torch.aten.size.int %5349, %int1_6758 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_6759 = torch.constant.int 16 %5351 = torch.aten.mul.int %5350, %int16_6759 : !torch.int, !torch.int -> !torch.int %int4_6760 = torch.constant.int 4 %int32_6761 = torch.constant.int 32 %int100_6762 = torch.constant.int 100 %5352 = torch.prim.ListConstruct %int4_6760, %5351, %int32_6761, %int100_6762 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5353 = torch.aten.view %5349, %5352 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_6763 = torch.constant.int 0 %int0_6764 = torch.constant.int 0 %int9223372036854775807_6765 = torch.constant.int 9223372036854775807 %int1_6766 = torch.constant.int 1 %5354 = torch.aten.slice.Tensor %5095, %int0_6763, %int0_6764, %int9223372036854775807_6765, %int1_6766 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int16_6767 = torch.constant.int 16 %5355 = torch.aten.mul.int %655, %int16_6767 : !torch.int, !torch.int -> !torch.int %int1_6768 = torch.constant.int 1 %int0_6769 = torch.constant.int 0 
%int1_6770 = torch.constant.int 1 %5356 = torch.aten.slice.Tensor %5354, %int1_6768, %int0_6769, %5355, %int1_6770 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_6771 = torch.constant.bool false %5357 = torch.aten.copy %5356, %5353, %false_6771 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_6772 = torch.constant.int 0 %int0_6773 = torch.constant.int 0 %int9223372036854775807_6774 = torch.constant.int 9223372036854775807 %int1_6775 = torch.constant.int 1 %5358 = torch.aten.slice.Tensor %5095, %int0_6772, %int0_6773, %int9223372036854775807_6774, %int1_6775 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_6776 = torch.constant.int 1 %int0_6777 = torch.constant.int 0 %int1_6778 = torch.constant.int 1 %5359 = torch.aten.slice_scatter %5358, %5357, %int1_6776, %int0_6777, %5355, %int1_6778 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_6779 = torch.constant.int 0 %int0_6780 = torch.constant.int 0 %int9223372036854775807_6781 = torch.constant.int 9223372036854775807 %int1_6782 = torch.constant.int 1 %5360 = torch.aten.slice_scatter %5095, %5359, %int0_6779, %int0_6780, %int9223372036854775807_6781, %int1_6782 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_6783 = torch.constant.int 1 %int1_6784 = torch.constant.int 1 %5361 = torch.aten.add.Scalar %5337, %int1_6783, %int1_6784 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_6785 = torch.constant.int 4 %5362 = torch.aten.mul.int %int4_6785, %655 : !torch.int, !torch.int -> !torch.int %5363 = 
torch.prim.ListConstruct %5362 : (!torch.int) -> !torch.list %5364 = torch.aten.view %5361, %5363 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int0_6786 = torch.constant.int 0 %5365 = torch.aten.index_select %5346, %int0_6786, %5364 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_6787 = torch.constant.int 4 %int16_6788 = torch.constant.int 16 %int32_6789 = torch.constant.int 32 %int100_6790 = torch.constant.int 100 %5366 = torch.prim.ListConstruct %int4_6787, %655, %int16_6788, %int32_6789, %int100_6790 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5367 = torch.aten.view %5365, %5366 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_6791 = torch.constant.int 1 %5368 = torch.aten.size.int %5367, %int1_6791 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_6792 = torch.constant.int 16 %5369 = torch.aten.mul.int %5368, %int16_6792 : !torch.int, !torch.int -> !torch.int %int4_6793 = torch.constant.int 4 %int32_6794 = torch.constant.int 32 %int100_6795 = torch.constant.int 100 %5370 = torch.prim.ListConstruct %int4_6793, %5369, %int32_6794, %int100_6795 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5371 = torch.aten.view %5367, %5370 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_6796 = torch.constant.int 0 %int0_6797 = torch.constant.int 0 %int9223372036854775807_6798 = torch.constant.int 9223372036854775807 %int1_6799 = torch.constant.int 1 %5372 = torch.aten.slice.Tensor %5112, %int0_6796, %int0_6797, %int9223372036854775807_6798, %int1_6799 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_6800 = torch.constant.int 1 %int0_6801 = torch.constant.int 0 %int1_6802 = torch.constant.int 1 %5373 = torch.aten.slice.Tensor %5372, 
%int1_6800, %int0_6801, %5355, %int1_6802 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_6803 = torch.constant.bool false %5374 = torch.aten.copy %5373, %5371, %false_6803 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_6804 = torch.constant.int 0 %int0_6805 = torch.constant.int 0 %int9223372036854775807_6806 = torch.constant.int 9223372036854775807 %int1_6807 = torch.constant.int 1 %5375 = torch.aten.slice.Tensor %5112, %int0_6804, %int0_6805, %int9223372036854775807_6806, %int1_6807 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_6808 = torch.constant.int 1 %int0_6809 = torch.constant.int 0 %int1_6810 = torch.constant.int 1 %5376 = torch.aten.slice_scatter %5375, %5374, %int1_6808, %int0_6809, %5355, %int1_6810 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_6811 = torch.constant.int 0 %int0_6812 = torch.constant.int 0 %int9223372036854775807_6813 = torch.constant.int 9223372036854775807 %int1_6814 = torch.constant.int 1 %5377 = torch.aten.slice_scatter %5112, %5376, %int0_6811, %int0_6812, %int9223372036854775807_6813, %int1_6814 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_6815 = torch.constant.int 0 %int0_6816 = torch.constant.int 0 %int9223372036854775807_6817 = torch.constant.int 9223372036854775807 %int1_6818 = torch.constant.int 1 %5378 = torch.aten.slice.Tensor %671, %int0_6815, %int0_6816, %int9223372036854775807_6817, %int1_6818 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_6819 = 
torch.constant.int 1 %int0_6820 = torch.constant.int 0 %int1_6821 = torch.constant.int 1 %5379 = torch.aten.slice.Tensor %5378, %int1_6819, %int0_6820, %5355, %int1_6821 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int0_6822 = torch.constant.int 0 %int0_6823 = torch.constant.int 0 %int9223372036854775807_6824 = torch.constant.int 9223372036854775807 %int1_6825 = torch.constant.int 1 %5380 = torch.aten.slice.Tensor %673, %int0_6822, %int0_6823, %int9223372036854775807_6824, %int1_6825 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_6826 = torch.constant.int 1 %int0_6827 = torch.constant.int 0 %int1_6828 = torch.constant.int 1 %5381 = torch.aten.slice.Tensor %5380, %int1_6826, %int0_6827, %5355, %int1_6828 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_6829 = torch.constant.int 1 %int2_6830 = torch.constant.int 2 %5382 = torch.aten.transpose.int %5218, %int1_6829, %int2_6830 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,1,100],f32> %int4_6831 = torch.constant.int 4 %int32_6832 = torch.constant.int 32 %int1_6833 = torch.constant.int 1 %int100_6834 = torch.constant.int 100 %5383 = torch.prim.ListConstruct %int4_6831, %int32_6832, %int1_6833, %int100_6834 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_6835 = torch.constant.bool false %5384 = torch.aten.expand %5382, %5383, %false_6835 : !torch.vtensor<[4,32,1,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,100],f32> %int128_6836 = torch.constant.int 128 %int1_6837 = torch.constant.int 1 %int100_6838 = torch.constant.int 100 %5385 = torch.prim.ListConstruct %int128_6836, %int1_6837, %int100_6838 : (!torch.int, !torch.int, !torch.int) -> !torch.list %5386 = torch.aten.view %5384, %5385 : 
!torch.vtensor<[4,32,1,100],f32>, !torch.list -> !torch.vtensor<[128,1,100],f32> %int0_6839 = torch.constant.int 0 %int0_6840 = torch.constant.int 0 %int9223372036854775807_6841 = torch.constant.int 9223372036854775807 %int1_6842 = torch.constant.int 1 %5387 = torch.aten.slice.Tensor %5360, %int0_6839, %int0_6840, %int9223372036854775807_6841, %int1_6842 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_6843 = torch.constant.int 1 %int0_6844 = torch.constant.int 0 %int1_6845 = torch.constant.int 1 %5388 = torch.aten.slice.Tensor %5387, %int1_6843, %int0_6844, %5355, %int1_6845 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_6846 = torch.constant.int 1 %int2_6847 = torch.constant.int 2 %5389 = torch.aten.transpose.int %5388, %int1_6846, %int2_6847 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int2_6848 = torch.constant.int 2 %int3_6849 = torch.constant.int 3 %5390 = torch.aten.transpose.int %5389, %int2_6848, %int3_6849 : !torch.vtensor<[4,32,?,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int1_6850 = torch.constant.int 1 %5391 = torch.aten.size.int %5379, %int1_6850 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_6851 = torch.constant.int 4 %int32_6852 = torch.constant.int 32 %int100_6853 = torch.constant.int 100 %5392 = torch.prim.ListConstruct %int4_6851, %int32_6852, %int100_6853, %5391 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_6854 = torch.constant.bool false %5393 = torch.aten.expand %5390, %5392, %false_6854 : !torch.vtensor<[4,32,100,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,100,?],f32> %int0_6855 = torch.constant.int 0 %5394 = torch.aten.clone %5393, %int0_6855 : !torch.vtensor<[4,32,100,?],f32>, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int128_6856 = 
torch.constant.int 128 %int100_6857 = torch.constant.int 100 %5395 = torch.prim.ListConstruct %int128_6856, %int100_6857, %5391 : (!torch.int, !torch.int, !torch.int) -> !torch.list %5396 = torch.aten._unsafe_view %5394, %5395 : !torch.vtensor<[4,32,100,?],f32>, !torch.list -> !torch.vtensor<[128,100,?],f32> %5397 = torch.aten.bmm %5386, %5396 : !torch.vtensor<[128,1,100],f32>, !torch.vtensor<[128,100,?],f32> -> !torch.vtensor<[128,1,?],f32> %int4_6858 = torch.constant.int 4 %int32_6859 = torch.constant.int 32 %int1_6860 = torch.constant.int 1 %5398 = torch.prim.ListConstruct %int4_6858, %int32_6859, %int1_6860, %5391 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5399 = torch.aten.view %5397, %5398 : !torch.vtensor<[128,1,?],f32>, !torch.list -> !torch.vtensor<[4,32,1,?],f32> %float1.000000e01_6861 = torch.constant.float 1.000000e+01 %5400 = torch.aten.div.Scalar %5399, %float1.000000e01_6861 : !torch.vtensor<[4,32,1,?],f32>, !torch.float -> !torch.vtensor<[4,32,1,?],f32> %int1_6862 = torch.constant.int 1 %5401 = torch.aten.add.Tensor %5400, %895, %int1_6862 : !torch.vtensor<[4,32,1,?],f32>, !torch.vtensor<[4,1,1,?],f32>, !torch.int -> !torch.vtensor<[4,32,1,?],f32> %int-1_6863 = torch.constant.int -1 %false_6864 = torch.constant.bool false %5402 = torch.aten._softmax %5401, %int-1_6863, %false_6864 : !torch.vtensor<[4,32,1,?],f32>, !torch.int, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int4_6865 = torch.constant.int 4 %int32_6866 = torch.constant.int 32 %int1_6867 = torch.constant.int 1 %5403 = torch.prim.ListConstruct %int4_6865, %int32_6866, %int1_6867, %5391 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_6868 = torch.constant.bool false %5404 = torch.aten.expand %5402, %5403, %false_6868 : !torch.vtensor<[4,32,1,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int128_6869 = torch.constant.int 128 %int1_6870 = torch.constant.int 1 %5405 = torch.prim.ListConstruct %int128_6869, %int1_6870, 
%5391 : (!torch.int, !torch.int, !torch.int) -> !torch.list %5406 = torch.aten.view %5404, %5405 : !torch.vtensor<[4,32,1,?],f32>, !torch.list -> !torch.vtensor<[128,1,?],f32> %int0_6871 = torch.constant.int 0 %int0_6872 = torch.constant.int 0 %int9223372036854775807_6873 = torch.constant.int 9223372036854775807 %int1_6874 = torch.constant.int 1 %5407 = torch.aten.slice.Tensor %5377, %int0_6871, %int0_6872, %int9223372036854775807_6873, %int1_6874 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_6875 = torch.constant.int 1 %int0_6876 = torch.constant.int 0 %int1_6877 = torch.constant.int 1 %5408 = torch.aten.slice.Tensor %5407, %int1_6875, %int0_6876, %5355, %int1_6877 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_6878 = torch.constant.int 1 %int2_6879 = torch.constant.int 2 %5409 = torch.aten.transpose.int %5408, %int1_6878, %int2_6879 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int1_6880 = torch.constant.int 1 %5410 = torch.aten.size.int %5381, %int1_6880 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_6881 = torch.constant.int 4 %int32_6882 = torch.constant.int 32 %int100_6883 = torch.constant.int 100 %5411 = torch.prim.ListConstruct %int4_6881, %int32_6882, %5410, %int100_6883 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_6884 = torch.constant.bool false %5412 = torch.aten.expand %5409, %5411, %false_6884 : !torch.vtensor<[4,32,?,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,?,100],f32> %int0_6885 = torch.constant.int 0 %5413 = torch.aten.clone %5412, %int0_6885 : !torch.vtensor<[4,32,?,100],f32>, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int128_6886 = torch.constant.int 128 %int100_6887 = torch.constant.int 100 %5414 = torch.prim.ListConstruct %int128_6886, %5410, %int100_6887 : 
(!torch.int, !torch.int, !torch.int) -> !torch.list %5415 = torch.aten._unsafe_view %5413, %5414 : !torch.vtensor<[4,32,?,100],f32>, !torch.list -> !torch.vtensor<[128,?,100],f32> %5416 = torch.aten.bmm %5406, %5415 : !torch.vtensor<[128,1,?],f32>, !torch.vtensor<[128,?,100],f32> -> !torch.vtensor<[128,1,100],f32> %int4_6888 = torch.constant.int 4 %int32_6889 = torch.constant.int 32 %int1_6890 = torch.constant.int 1 %int100_6891 = torch.constant.int 100 %5417 = torch.prim.ListConstruct %int4_6888, %int32_6889, %int1_6890, %int100_6891 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5418 = torch.aten.view %5416, %5417 : !torch.vtensor<[128,1,100],f32>, !torch.list -> !torch.vtensor<[4,32,1,100],f32> %int1_6892 = torch.constant.int 1 %int2_6893 = torch.constant.int 2 %5419 = torch.aten.transpose.int %5418, %int1_6892, %int2_6893 : !torch.vtensor<[4,32,1,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,1,32,100],f32> %int4_6894 = torch.constant.int 4 %int1_6895 = torch.constant.int 1 %int-1_6896 = torch.constant.int -1 %5420 = torch.prim.ListConstruct %int4_6894, %int1_6895, %int-1_6896 : (!torch.int, !torch.int, !torch.int) -> !torch.list %5421 = torch.aten.view %5419, %5420 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,3200],f32> %5422 = torch_c.to_builtin_tensor %5421 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_6897 = tensor.cast %5422 : tensor<4x1x3200xf32> to tensor %5423 = torch_c.to_builtin_tensor %159 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %5424 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_6897, %5423) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_6898 = tensor.cast %5424 : tensor to tensor<4x1x3200xf32> %5425 = torch_c.from_builtin_tensor %cast_6898 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int1_6899 = torch.constant.int 1 %5426 = torch.aten.add.Tensor %5183, %5425, %int1_6899 : !torch.vtensor<[4,1,3200],f32>, 
!torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_6900 = torch.constant.int 2 %5427 = torch.aten.pow.Tensor_Scalar %5426, %int2_6900 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_6901 = torch.constant.int -1 %5428 = torch.prim.ListConstruct %int-1_6901 : (!torch.int) -> !torch.list %true_6902 = torch.constant.bool true %none_6903 = torch.constant.none %5429 = torch.aten.mean.dim %5427, %5428, %true_6902, %none_6903 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_6904 = torch.constant.float 9.9999999747524271E-7 %int1_6905 = torch.constant.int 1 %5430 = torch.aten.add.Scalar %5429, %float9.999990e-07_6904, %int1_6905 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %5431 = torch.aten.rsqrt %5430 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %5432 = torch.aten.mul.Tensor %5426, %5431 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %5433 = torch.aten.mul.Tensor %5432, %160 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %5434 = torch_c.to_builtin_tensor %5433 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_6906 = tensor.cast %5434 : tensor<4x1x3200xf32> to tensor %5435 = torch_c.to_builtin_tensor %161 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %5436 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_6906, %5435) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_6907 = tensor.cast %5436 : tensor to tensor<4x1x8640xf32> %5437 = torch_c.from_builtin_tensor %cast_6907 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %5438 = torch.aten.silu %5437 : !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32> %5439 = torch_c.to_builtin_tensor %5433 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_6908 = tensor.cast %5439 
: tensor<4x1x3200xf32> to tensor %5440 = torch_c.to_builtin_tensor %162 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %5441 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_6908, %5440) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_6909 = tensor.cast %5441 : tensor to tensor<4x1x8640xf32> %5442 = torch_c.from_builtin_tensor %cast_6909 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %5443 = torch.aten.mul.Tensor %5438, %5442 : !torch.vtensor<[4,1,8640],f32>, !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32> %5444 = torch_c.to_builtin_tensor %5443 : !torch.vtensor<[4,1,8640],f32> -> tensor<4x1x8640xf32> %cast_6910 = tensor.cast %5444 : tensor<4x1x8640xf32> to tensor %5445 = torch_c.to_builtin_tensor %163 : !torch.vtensor<[3200,8640],f16> -> tensor<3200x8640xf16> %5446 = util.call @sharktank_mmtfp_3d_3200_8640_f32f16f32(%cast_6910, %5445) : (tensor, tensor<3200x8640xf16>) -> tensor %cast_6911 = tensor.cast %5446 : tensor to tensor<4x1x3200xf32> %5447 = torch_c.from_builtin_tensor %cast_6911 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int1_6912 = torch.constant.int 1 %5448 = torch.aten.add.Tensor %5426, %5447, %int1_6912 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_6913 = torch.constant.int 2 %5449 = torch.aten.pow.Tensor_Scalar %5448, %int2_6913 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_6914 = torch.constant.int -1 %5450 = torch.prim.ListConstruct %int-1_6914 : (!torch.int) -> !torch.list %true_6915 = torch.constant.bool true %none_6916 = torch.constant.none %5451 = torch.aten.mean.dim %5449, %5450, %true_6915, %none_6916 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_6917 = torch.constant.float 9.9999999747524271E-7 %int1_6918 = torch.constant.int 1 %5452 = torch.aten.add.Scalar %5451, %float9.999990e-07_6917, 
%int1_6918 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %5453 = torch.aten.rsqrt %5452 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %5454 = torch.aten.mul.Tensor %5448, %5453 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %5455 = torch.aten.mul.Tensor %5454, %164 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %5456 = torch_c.to_builtin_tensor %5455 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_6919 = tensor.cast %5456 : tensor<4x1x3200xf32> to tensor %5457 = torch_c.to_builtin_tensor %165 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %5458 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_6919, %5457) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_6920 = tensor.cast %5458 : tensor to tensor<4x1x3200xf32> %5459 = torch_c.from_builtin_tensor %cast_6920 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %5460 = torch_c.to_builtin_tensor %5455 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_6921 = tensor.cast %5460 : tensor<4x1x3200xf32> to tensor %5461 = torch_c.to_builtin_tensor %166 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %5462 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_6921, %5461) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_6922 = tensor.cast %5462 : tensor to tensor<4x1x3200xf32> %5463 = torch_c.from_builtin_tensor %cast_6922 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %5464 = torch_c.to_builtin_tensor %5455 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_6923 = tensor.cast %5464 : tensor<4x1x3200xf32> to tensor %5465 = torch_c.to_builtin_tensor %167 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %5466 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_6923, %5465) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_6924 = tensor.cast %5466 : tensor to 
tensor<4x1x3200xf32> %5467 = torch_c.from_builtin_tensor %cast_6924 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int4_6925 = torch.constant.int 4 %int1_6926 = torch.constant.int 1 %int32_6927 = torch.constant.int 32 %int100_6928 = torch.constant.int 100 %5468 = torch.prim.ListConstruct %int4_6925, %int1_6926, %int32_6927, %int100_6928 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5469 = torch.aten.view %5459, %5468 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_6929 = torch.constant.int 4 %int1_6930 = torch.constant.int 1 %int32_6931 = torch.constant.int 32 %int100_6932 = torch.constant.int 100 %5470 = torch.prim.ListConstruct %int4_6929, %int1_6930, %int32_6931, %int100_6932 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5471 = torch.aten.view %5463, %5470 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_6933 = torch.constant.int 4 %int1_6934 = torch.constant.int 1 %int32_6935 = torch.constant.int 32 %int100_6936 = torch.constant.int 100 %5472 = torch.prim.ListConstruct %int4_6933, %int1_6934, %int32_6935, %int100_6936 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5473 = torch.aten.view %5467, %5472 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_6937 = torch.constant.int 4 %int1_6938 = torch.constant.int 1 %int32_6939 = torch.constant.int 32 %int-1_6940 = torch.constant.int -1 %int2_6941 = torch.constant.int 2 %5474 = torch.prim.ListConstruct %int4_6937, %int1_6938, %int32_6939, %int-1_6940, %int2_6941 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5475 = torch.aten.view %5469, %5474 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %5476 = torch.aten.view_as_complex %5475 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %int4_6942 = torch.constant.int 4 %int1_6943 = 
torch.constant.int 1 %int32_6944 = torch.constant.int 32 %int-1_6945 = torch.constant.int -1 %int2_6946 = torch.constant.int 2 %5477 = torch.prim.ListConstruct %int4_6942, %int1_6943, %int32_6944, %int-1_6945, %int2_6946 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5478 = torch.aten.view %5471, %5477 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %5479 = torch.aten.view_as_complex %5478 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %5480 = torch.aten.mul.Tensor %5476, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %5481 = torch.aten.view_as_real %5480 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_6947 = torch.constant.int 4 %int1_6948 = torch.constant.int 1 %int32_6949 = torch.constant.int 32 %int100_6950 = torch.constant.int 100 %5482 = torch.prim.ListConstruct %int4_6947, %int1_6948, %int32_6949, %int100_6950 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5483 = torch.aten.view %5481, %5482 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %5484 = torch.aten.mul.Tensor %5479, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %5485 = torch.aten.view_as_real %5484 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_6951 = torch.constant.int 4 %int1_6952 = torch.constant.int 1 %int32_6953 = torch.constant.int 32 %int100_6954 = torch.constant.int 100 %5486 = torch.prim.ListConstruct %int4_6951, %int1_6952, %int32_6953, %int100_6954 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5487 = torch.aten.view %5485, %5486 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int1_6955 = torch.constant.int 1 %int1_6956 = torch.constant.int 1 %5488 = torch.aten.add.Scalar 
%arg2, %int1_6955, %int1_6956 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[4],si64> %int0_6957 = torch.constant.int 0 %int0_6958 = torch.constant.int 0 %5489 = torch.aten.select.int %5488, %int0_6957, %int0_6958 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_6959 = torch.constant.int 0 %int0_6960 = torch.constant.int 0 %5490 = torch.aten.select.int %arg3, %int0_6959, %int0_6960 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_6961 = torch.constant.int 0 %int0_6962 = torch.constant.int 0 %int9223372036854775807_6963 = torch.constant.int 9223372036854775807 %int1_6964 = torch.constant.int 1 %5491 = torch.aten.slice.Tensor %5490, %int0_6961, %int0_6962, %int9223372036854775807_6963, %int1_6964 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_6965 = torch.constant.int 16 %5492 = torch.aten.floor_divide.Scalar %5489, %int16_6965 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_6966 = torch.constant.int 0 %5493 = torch.aten.index_select %5491, %int0_6966, %5492 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_6967 = torch.constant.int 16 %5494 = torch.aten.remainder.Scalar %5489, %int16_6967 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_6968 = torch.constant.none %5495 = torch.aten.clone %526, %none_6968 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_6969 = torch.constant.none %5496 = torch.aten.clone %527, %none_6969 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_6970 = torch.constant.int 0 %5497 = torch.aten.unsqueeze %5494, %int0_6970 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_6971 = torch.constant.int 0 %int0_6972 = torch.constant.int 0 %5498 = torch.aten.select.int %5487, %int0_6971, %int0_6972 : !torch.vtensor<[4,1,32,100],f32>, 
!torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_6973 = torch.constant.int 0 %int0_6974 = torch.constant.int 0 %5499 = torch.aten.select.int %5498, %int0_6973, %int0_6974 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %int-1_6975 = torch.constant.int -1 %int26_6976 = torch.constant.int 26 %int2_6977 = torch.constant.int 2 %int16_6978 = torch.constant.int 16 %int32_6979 = torch.constant.int 32 %int100_6980 = torch.constant.int 100 %5500 = torch.prim.ListConstruct %int-1_6975, %int26_6976, %int2_6977, %int16_6978, %int32_6979, %int100_6980 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5501 = torch.aten.view %5335, %5500 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %5502 = torch.prim.ListConstruct %5493, %5495, %5496, %5497 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_6981 = torch.constant.bool false %5503 = torch.aten.index_put %5501, %5502, %5499, %false_6981 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_6982 = torch.constant.int 2662400 %5504 = torch.prim.ListConstruct %731, %int2662400_6982 : (!torch.int, !torch.int) -> !torch.list %5505 = torch.aten.view %5503, %5504 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_6983 = torch.constant.int -1 %int26_6984 = torch.constant.int 26 %int2_6985 = torch.constant.int 2 %int16_6986 = torch.constant.int 16 %int32_6987 = torch.constant.int 32 %int100_6988 = torch.constant.int 100 %5506 = torch.prim.ListConstruct %int-1_6983, %int26_6984, %int2_6985, %int16_6986, %int32_6987, %int100_6988 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5507 = torch.aten.view %5505, %5506 : !torch.vtensor<[?,2662400],f32>, 
!torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_6989 = torch.constant.none %5508 = torch.aten.clone %528, %none_6989 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_6990 = torch.constant.none %5509 = torch.aten.clone %529, %none_6990 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_6991 = torch.constant.int 0 %5510 = torch.aten.unsqueeze %5494, %int0_6991 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_6992 = torch.constant.int 0 %int0_6993 = torch.constant.int 0 %5511 = torch.aten.select.int %5473, %int0_6992, %int0_6993 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_6994 = torch.constant.int 0 %int0_6995 = torch.constant.int 0 %5512 = torch.aten.select.int %5511, %int0_6994, %int0_6995 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %5513 = torch.prim.ListConstruct %5493, %5508, %5509, %5510 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_6996 = torch.constant.bool false %5514 = torch.aten.index_put %5507, %5513, %5512, %false_6996 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_6997 = torch.constant.int 2662400 %5515 = torch.prim.ListConstruct %731, %int2662400_6997 : (!torch.int, !torch.int) -> !torch.list %5516 = torch.aten.view %5514, %5515 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_6998 = torch.constant.int -1 %int26_6999 = torch.constant.int 26 %int2_7000 = torch.constant.int 2 %int16_7001 = torch.constant.int 16 %int32_7002 = torch.constant.int 32 %int100_7003 = torch.constant.int 100 %5517 = torch.prim.ListConstruct %int-1_6998, %int26_6999, %int2_7000, %int16_7001, %int32_7002, %int100_7003 : (!torch.int, !torch.int, !torch.int, !torch.int, 
!torch.int, !torch.int) -> !torch.list %5518 = torch.aten.view %5516, %5517 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_7004 = torch.constant.int 0 %int1_7005 = torch.constant.int 1 %5519 = torch.aten.select.int %5488, %int0_7004, %int1_7005 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_7006 = torch.constant.int 0 %int1_7007 = torch.constant.int 1 %5520 = torch.aten.select.int %arg3, %int0_7006, %int1_7007 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_7008 = torch.constant.int 0 %int0_7009 = torch.constant.int 0 %int9223372036854775807_7010 = torch.constant.int 9223372036854775807 %int1_7011 = torch.constant.int 1 %5521 = torch.aten.slice.Tensor %5520, %int0_7008, %int0_7009, %int9223372036854775807_7010, %int1_7011 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_7012 = torch.constant.int 16 %5522 = torch.aten.floor_divide.Scalar %5519, %int16_7012 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_7013 = torch.constant.int 0 %5523 = torch.aten.index_select %5521, %int0_7013, %5522 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_7014 = torch.constant.int 16 %5524 = torch.aten.remainder.Scalar %5519, %int16_7014 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_7015 = torch.constant.none %5525 = torch.aten.clone %530, %none_7015 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_7016 = torch.constant.none %5526 = torch.aten.clone %531, %none_7016 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_7017 = torch.constant.int 0 %5527 = torch.aten.unsqueeze %5524, %int0_7017 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_7018 = torch.constant.int 0 %int1_7019 = torch.constant.int 1 %5528 = torch.aten.select.int %5487, 
%int0_7018, %int1_7019 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_7020 = torch.constant.int 0 %int0_7021 = torch.constant.int 0 %5529 = torch.aten.select.int %5528, %int0_7020, %int0_7021 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %5530 = torch.prim.ListConstruct %5523, %5525, %5526, %5527 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_7022 = torch.constant.bool false %5531 = torch.aten.index_put %5518, %5530, %5529, %false_7022 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_7023 = torch.constant.int 2662400 %5532 = torch.prim.ListConstruct %731, %int2662400_7023 : (!torch.int, !torch.int) -> !torch.list %5533 = torch.aten.view %5531, %5532 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_7024 = torch.constant.int -1 %int26_7025 = torch.constant.int 26 %int2_7026 = torch.constant.int 2 %int16_7027 = torch.constant.int 16 %int32_7028 = torch.constant.int 32 %int100_7029 = torch.constant.int 100 %5534 = torch.prim.ListConstruct %int-1_7024, %int26_7025, %int2_7026, %int16_7027, %int32_7028, %int100_7029 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5535 = torch.aten.view %5533, %5534 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_7030 = torch.constant.none %5536 = torch.aten.clone %532, %none_7030 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_7031 = torch.constant.none %5537 = torch.aten.clone %533, %none_7031 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_7032 = torch.constant.int 0 %5538 = torch.aten.unsqueeze %5524, %int0_7032 : !torch.vtensor<[],si64>, !torch.int -> 
!torch.vtensor<[1],si64> %int0_7033 = torch.constant.int 0 %int1_7034 = torch.constant.int 1 %5539 = torch.aten.select.int %5473, %int0_7033, %int1_7034 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_7035 = torch.constant.int 0 %int0_7036 = torch.constant.int 0 %5540 = torch.aten.select.int %5539, %int0_7035, %int0_7036 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %5541 = torch.prim.ListConstruct %5523, %5536, %5537, %5538 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_7037 = torch.constant.bool false %5542 = torch.aten.index_put %5535, %5541, %5540, %false_7037 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_7038 = torch.constant.int 2662400 %5543 = torch.prim.ListConstruct %731, %int2662400_7038 : (!torch.int, !torch.int) -> !torch.list %5544 = torch.aten.view %5542, %5543 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_7039 = torch.constant.int -1 %int26_7040 = torch.constant.int 26 %int2_7041 = torch.constant.int 2 %int16_7042 = torch.constant.int 16 %int32_7043 = torch.constant.int 32 %int100_7044 = torch.constant.int 100 %5545 = torch.prim.ListConstruct %int-1_7039, %int26_7040, %int2_7041, %int16_7042, %int32_7043, %int100_7044 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5546 = torch.aten.view %5544, %5545 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_7045 = torch.constant.int 0 %int2_7046 = torch.constant.int 2 %5547 = torch.aten.select.int %5488, %int0_7045, %int2_7046 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_7047 = torch.constant.int 0 %int2_7048 = torch.constant.int 2 %5548 = 
torch.aten.select.int %arg3, %int0_7047, %int2_7048 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_7049 = torch.constant.int 0 %int0_7050 = torch.constant.int 0 %int9223372036854775807_7051 = torch.constant.int 9223372036854775807 %int1_7052 = torch.constant.int 1 %5549 = torch.aten.slice.Tensor %5548, %int0_7049, %int0_7050, %int9223372036854775807_7051, %int1_7052 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_7053 = torch.constant.int 16 %5550 = torch.aten.floor_divide.Scalar %5547, %int16_7053 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_7054 = torch.constant.int 0 %5551 = torch.aten.index_select %5549, %int0_7054, %5550 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_7055 = torch.constant.int 16 %5552 = torch.aten.remainder.Scalar %5547, %int16_7055 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_7056 = torch.constant.none %5553 = torch.aten.clone %534, %none_7056 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_7057 = torch.constant.none %5554 = torch.aten.clone %535, %none_7057 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_7058 = torch.constant.int 0 %5555 = torch.aten.unsqueeze %5552, %int0_7058 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_7059 = torch.constant.int 0 %int2_7060 = torch.constant.int 2 %5556 = torch.aten.select.int %5487, %int0_7059, %int2_7060 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_7061 = torch.constant.int 0 %int0_7062 = torch.constant.int 0 %5557 = torch.aten.select.int %5556, %int0_7061, %int0_7062 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %5558 = torch.prim.ListConstruct %5551, %5553, %5554, %5555 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, 
!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_7063 = torch.constant.bool false %5559 = torch.aten.index_put %5546, %5558, %5557, %false_7063 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_7064 = torch.constant.int 2662400 %5560 = torch.prim.ListConstruct %731, %int2662400_7064 : (!torch.int, !torch.int) -> !torch.list %5561 = torch.aten.view %5559, %5560 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_7065 = torch.constant.int -1 %int26_7066 = torch.constant.int 26 %int2_7067 = torch.constant.int 2 %int16_7068 = torch.constant.int 16 %int32_7069 = torch.constant.int 32 %int100_7070 = torch.constant.int 100 %5562 = torch.prim.ListConstruct %int-1_7065, %int26_7066, %int2_7067, %int16_7068, %int32_7069, %int100_7070 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5563 = torch.aten.view %5561, %5562 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_7071 = torch.constant.none %5564 = torch.aten.clone %536, %none_7071 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_7072 = torch.constant.none %5565 = torch.aten.clone %537, %none_7072 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_7073 = torch.constant.int 0 %5566 = torch.aten.unsqueeze %5552, %int0_7073 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_7074 = torch.constant.int 0 %int2_7075 = torch.constant.int 2 %5567 = torch.aten.select.int %5473, %int0_7074, %int2_7075 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_7076 = torch.constant.int 0 %int0_7077 = torch.constant.int 0 %5568 = torch.aten.select.int %5567, %int0_7076, %int0_7077 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %5569 
= torch.prim.ListConstruct %5551, %5564, %5565, %5566 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_7078 = torch.constant.bool false %5570 = torch.aten.index_put %5563, %5569, %5568, %false_7078 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_7079 = torch.constant.int 2662400 %5571 = torch.prim.ListConstruct %731, %int2662400_7079 : (!torch.int, !torch.int) -> !torch.list %5572 = torch.aten.view %5570, %5571 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_7080 = torch.constant.int -1 %int26_7081 = torch.constant.int 26 %int2_7082 = torch.constant.int 2 %int16_7083 = torch.constant.int 16 %int32_7084 = torch.constant.int 32 %int100_7085 = torch.constant.int 100 %5573 = torch.prim.ListConstruct %int-1_7080, %int26_7081, %int2_7082, %int16_7083, %int32_7084, %int100_7085 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5574 = torch.aten.view %5572, %5573 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_7086 = torch.constant.int 0 %int3_7087 = torch.constant.int 3 %5575 = torch.aten.select.int %5488, %int0_7086, %int3_7087 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_7088 = torch.constant.int 0 %int3_7089 = torch.constant.int 3 %5576 = torch.aten.select.int %arg3, %int0_7088, %int3_7089 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_7090 = torch.constant.int 0 %int0_7091 = torch.constant.int 0 %int9223372036854775807_7092 = torch.constant.int 9223372036854775807 %int1_7093 = torch.constant.int 1 %5577 = torch.aten.slice.Tensor %5576, %int0_7090, %int0_7091, %int9223372036854775807_7092, %int1_7093 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> 
!torch.vtensor<[?],si64> %int16_7094 = torch.constant.int 16 %5578 = torch.aten.floor_divide.Scalar %5575, %int16_7094 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_7095 = torch.constant.int 0 %5579 = torch.aten.index_select %5577, %int0_7095, %5578 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_7096 = torch.constant.int 16 %5580 = torch.aten.remainder.Scalar %5575, %int16_7096 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_7097 = torch.constant.none %5581 = torch.aten.clone %538, %none_7097 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_7098 = torch.constant.none %5582 = torch.aten.clone %539, %none_7098 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_7099 = torch.constant.int 0 %5583 = torch.aten.unsqueeze %5580, %int0_7099 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_7100 = torch.constant.int 0 %int3_7101 = torch.constant.int 3 %5584 = torch.aten.select.int %5487, %int0_7100, %int3_7101 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_7102 = torch.constant.int 0 %int0_7103 = torch.constant.int 0 %5585 = torch.aten.select.int %5584, %int0_7102, %int0_7103 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %5586 = torch.prim.ListConstruct %5579, %5581, %5582, %5583 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_7104 = torch.constant.bool false %5587 = torch.aten.index_put %5574, %5586, %5585, %false_7104 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_7105 = torch.constant.int 2662400 %5588 = torch.prim.ListConstruct %731, %int2662400_7105 : (!torch.int, !torch.int) -> !torch.list %5589 = torch.aten.view %5587, %5588 
: !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_7106 = torch.constant.int -1 %int26_7107 = torch.constant.int 26 %int2_7108 = torch.constant.int 2 %int16_7109 = torch.constant.int 16 %int32_7110 = torch.constant.int 32 %int100_7111 = torch.constant.int 100 %5590 = torch.prim.ListConstruct %int-1_7106, %int26_7107, %int2_7108, %int16_7109, %int32_7110, %int100_7111 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5591 = torch.aten.view %5589, %5590 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_7112 = torch.constant.none %5592 = torch.aten.clone %540, %none_7112 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_7113 = torch.constant.none %5593 = torch.aten.clone %541, %none_7113 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_7114 = torch.constant.int 0 %5594 = torch.aten.unsqueeze %5580, %int0_7114 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_7115 = torch.constant.int 0 %int3_7116 = torch.constant.int 3 %5595 = torch.aten.select.int %5473, %int0_7115, %int3_7116 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_7117 = torch.constant.int 0 %int0_7118 = torch.constant.int 0 %5596 = torch.aten.select.int %5595, %int0_7117, %int0_7118 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %5597 = torch.prim.ListConstruct %5579, %5592, %5593, %5594 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_7119 = torch.constant.bool false %5598 = torch.aten.index_put %5591, %5597, %5596, %false_7119 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_7120 = torch.constant.int 2662400 %5599 = 
torch.prim.ListConstruct %731, %int2662400_7120 : (!torch.int, !torch.int) -> !torch.list %5600 = torch.aten.view %5598, %5599 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int52_7121 = torch.constant.int 52 %5601 = torch.aten.mul.Scalar %arg3, %int52_7121 : !torch.vtensor<[4,?],si64>, !torch.int -> !torch.vtensor<[4,?],si64> %int36 = torch.constant.int 36 %int1_7122 = torch.constant.int 1 %5602 = torch.aten.add.Scalar %5601, %int36, %int1_7122 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_7123 = torch.constant.int 4 %5603 = torch.aten.mul.int %int4_7123, %655 : !torch.int, !torch.int -> !torch.int %5604 = torch.prim.ListConstruct %5603 : (!torch.int) -> !torch.list %5605 = torch.aten.view %5602, %5604 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int-1_7124 = torch.constant.int -1 %int26_7125 = torch.constant.int 26 %int2_7126 = torch.constant.int 2 %int16_7127 = torch.constant.int 16 %int32_7128 = torch.constant.int 32 %int100_7129 = torch.constant.int 100 %5606 = torch.prim.ListConstruct %int-1_7124, %int26_7125, %int2_7126, %int16_7127, %int32_7128, %int100_7129 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5607 = torch.aten.view %5600, %5606 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int26_7130 = torch.constant.int 26 %5608 = torch.aten.mul.int %731, %int26_7130 : !torch.int, !torch.int -> !torch.int %int2_7131 = torch.constant.int 2 %5609 = torch.aten.mul.int %5608, %int2_7131 : !torch.int, !torch.int -> !torch.int %int16_7132 = torch.constant.int 16 %int32_7133 = torch.constant.int 32 %int100_7134 = torch.constant.int 100 %5610 = torch.prim.ListConstruct %5609, %int16_7132, %int32_7133, %int100_7134 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5611 = torch.aten.view %5607, %5610 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> 
!torch.vtensor<[?,16,32,100],f32> %int0_7135 = torch.constant.int 0 %5612 = torch.aten.index_select %5611, %int0_7135, %5605 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_7136 = torch.constant.int 4 %int16_7137 = torch.constant.int 16 %int32_7138 = torch.constant.int 32 %int100_7139 = torch.constant.int 100 %5613 = torch.prim.ListConstruct %int4_7136, %655, %int16_7137, %int32_7138, %int100_7139 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5614 = torch.aten.view %5612, %5613 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_7140 = torch.constant.int 1 %5615 = torch.aten.size.int %5614, %int1_7140 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_7141 = torch.constant.int 16 %5616 = torch.aten.mul.int %5615, %int16_7141 : !torch.int, !torch.int -> !torch.int %int4_7142 = torch.constant.int 4 %int32_7143 = torch.constant.int 32 %int100_7144 = torch.constant.int 100 %5617 = torch.prim.ListConstruct %int4_7142, %5616, %int32_7143, %int100_7144 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5618 = torch.aten.view %5614, %5617 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_7145 = torch.constant.int 0 %int0_7146 = torch.constant.int 0 %int9223372036854775807_7147 = torch.constant.int 9223372036854775807 %int1_7148 = torch.constant.int 1 %5619 = torch.aten.slice.Tensor %5360, %int0_7145, %int0_7146, %int9223372036854775807_7147, %int1_7148 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int16_7149 = torch.constant.int 16 %5620 = torch.aten.mul.int %655, %int16_7149 : !torch.int, !torch.int -> !torch.int %int1_7150 = torch.constant.int 1 %int0_7151 = torch.constant.int 0 %int1_7152 = torch.constant.int 1 %5621 = torch.aten.slice.Tensor %5619, %int1_7150, %int0_7151, 
%5620, %int1_7152 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_7153 = torch.constant.bool false %5622 = torch.aten.copy %5621, %5618, %false_7153 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_7154 = torch.constant.int 0 %int0_7155 = torch.constant.int 0 %int9223372036854775807_7156 = torch.constant.int 9223372036854775807 %int1_7157 = torch.constant.int 1 %5623 = torch.aten.slice.Tensor %5360, %int0_7154, %int0_7155, %int9223372036854775807_7156, %int1_7157 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_7158 = torch.constant.int 1 %int0_7159 = torch.constant.int 0 %int1_7160 = torch.constant.int 1 %5624 = torch.aten.slice_scatter %5623, %5622, %int1_7158, %int0_7159, %5620, %int1_7160 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_7161 = torch.constant.int 0 %int0_7162 = torch.constant.int 0 %int9223372036854775807_7163 = torch.constant.int 9223372036854775807 %int1_7164 = torch.constant.int 1 %5625 = torch.aten.slice_scatter %5360, %5624, %int0_7161, %int0_7162, %int9223372036854775807_7163, %int1_7164 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_7165 = torch.constant.int 1 %int1_7166 = torch.constant.int 1 %5626 = torch.aten.add.Scalar %5602, %int1_7165, %int1_7166 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_7167 = torch.constant.int 4 %5627 = torch.aten.mul.int %int4_7167, %655 : !torch.int, !torch.int -> !torch.int %5628 = torch.prim.ListConstruct %5627 : (!torch.int) -> !torch.list %5629 = torch.aten.view %5626, %5628 : 
!torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int0_7168 = torch.constant.int 0 %5630 = torch.aten.index_select %5611, %int0_7168, %5629 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_7169 = torch.constant.int 4 %int16_7170 = torch.constant.int 16 %int32_7171 = torch.constant.int 32 %int100_7172 = torch.constant.int 100 %5631 = torch.prim.ListConstruct %int4_7169, %655, %int16_7170, %int32_7171, %int100_7172 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5632 = torch.aten.view %5630, %5631 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_7173 = torch.constant.int 1 %5633 = torch.aten.size.int %5632, %int1_7173 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_7174 = torch.constant.int 16 %5634 = torch.aten.mul.int %5633, %int16_7174 : !torch.int, !torch.int -> !torch.int %int4_7175 = torch.constant.int 4 %int32_7176 = torch.constant.int 32 %int100_7177 = torch.constant.int 100 %5635 = torch.prim.ListConstruct %int4_7175, %5634, %int32_7176, %int100_7177 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5636 = torch.aten.view %5632, %5635 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_7178 = torch.constant.int 0 %int0_7179 = torch.constant.int 0 %int9223372036854775807_7180 = torch.constant.int 9223372036854775807 %int1_7181 = torch.constant.int 1 %5637 = torch.aten.slice.Tensor %5377, %int0_7178, %int0_7179, %int9223372036854775807_7180, %int1_7181 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_7182 = torch.constant.int 1 %int0_7183 = torch.constant.int 0 %int1_7184 = torch.constant.int 1 %5638 = torch.aten.slice.Tensor %5637, %int1_7182, %int0_7183, %5620, %int1_7184 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, 
!torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_7185 = torch.constant.bool false %5639 = torch.aten.copy %5638, %5636, %false_7185 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_7186 = torch.constant.int 0 %int0_7187 = torch.constant.int 0 %int9223372036854775807_7188 = torch.constant.int 9223372036854775807 %int1_7189 = torch.constant.int 1 %5640 = torch.aten.slice.Tensor %5377, %int0_7186, %int0_7187, %int9223372036854775807_7188, %int1_7189 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_7190 = torch.constant.int 1 %int0_7191 = torch.constant.int 0 %int1_7192 = torch.constant.int 1 %5641 = torch.aten.slice_scatter %5640, %5639, %int1_7190, %int0_7191, %5620, %int1_7192 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_7193 = torch.constant.int 0 %int0_7194 = torch.constant.int 0 %int9223372036854775807_7195 = torch.constant.int 9223372036854775807 %int1_7196 = torch.constant.int 1 %5642 = torch.aten.slice_scatter %5377, %5641, %int0_7193, %int0_7194, %int9223372036854775807_7195, %int1_7196 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_7197 = torch.constant.int 0 %int0_7198 = torch.constant.int 0 %int9223372036854775807_7199 = torch.constant.int 9223372036854775807 %int1_7200 = torch.constant.int 1 %5643 = torch.aten.slice.Tensor %671, %int0_7197, %int0_7198, %int9223372036854775807_7199, %int1_7200 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_7201 = torch.constant.int 1 %int0_7202 = torch.constant.int 0 %int1_7203 = torch.constant.int 1 %5644 = torch.aten.slice.Tensor 
%5643, %int1_7201, %int0_7202, %5620, %int1_7203 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int0_7204 = torch.constant.int 0 %int0_7205 = torch.constant.int 0 %int9223372036854775807_7206 = torch.constant.int 9223372036854775807 %int1_7207 = torch.constant.int 1 %5645 = torch.aten.slice.Tensor %673, %int0_7204, %int0_7205, %int9223372036854775807_7206, %int1_7207 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_7208 = torch.constant.int 1 %int0_7209 = torch.constant.int 0 %int1_7210 = torch.constant.int 1 %5646 = torch.aten.slice.Tensor %5645, %int1_7208, %int0_7209, %5620, %int1_7210 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_7211 = torch.constant.int 1 %int2_7212 = torch.constant.int 2 %5647 = torch.aten.transpose.int %5483, %int1_7211, %int2_7212 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,1,100],f32> %int4_7213 = torch.constant.int 4 %int32_7214 = torch.constant.int 32 %int1_7215 = torch.constant.int 1 %int100_7216 = torch.constant.int 100 %5648 = torch.prim.ListConstruct %int4_7213, %int32_7214, %int1_7215, %int100_7216 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_7217 = torch.constant.bool false %5649 = torch.aten.expand %5647, %5648, %false_7217 : !torch.vtensor<[4,32,1,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,100],f32> %int128_7218 = torch.constant.int 128 %int1_7219 = torch.constant.int 1 %int100_7220 = torch.constant.int 100 %5650 = torch.prim.ListConstruct %int128_7218, %int1_7219, %int100_7220 : (!torch.int, !torch.int, !torch.int) -> !torch.list %5651 = torch.aten.view %5649, %5650 : !torch.vtensor<[4,32,1,100],f32>, !torch.list -> !torch.vtensor<[128,1,100],f32> %int0_7221 = torch.constant.int 0 %int0_7222 = 
torch.constant.int 0 %int9223372036854775807_7223 = torch.constant.int 9223372036854775807 %int1_7224 = torch.constant.int 1 %5652 = torch.aten.slice.Tensor %5625, %int0_7221, %int0_7222, %int9223372036854775807_7223, %int1_7224 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_7225 = torch.constant.int 1 %int0_7226 = torch.constant.int 0 %int1_7227 = torch.constant.int 1 %5653 = torch.aten.slice.Tensor %5652, %int1_7225, %int0_7226, %5620, %int1_7227 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_7228 = torch.constant.int 1 %int2_7229 = torch.constant.int 2 %5654 = torch.aten.transpose.int %5653, %int1_7228, %int2_7229 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int2_7230 = torch.constant.int 2 %int3_7231 = torch.constant.int 3 %5655 = torch.aten.transpose.int %5654, %int2_7230, %int3_7231 : !torch.vtensor<[4,32,?,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int1_7232 = torch.constant.int 1 %5656 = torch.aten.size.int %5644, %int1_7232 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_7233 = torch.constant.int 4 %int32_7234 = torch.constant.int 32 %int100_7235 = torch.constant.int 100 %5657 = torch.prim.ListConstruct %int4_7233, %int32_7234, %int100_7235, %5656 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_7236 = torch.constant.bool false %5658 = torch.aten.expand %5655, %5657, %false_7236 : !torch.vtensor<[4,32,100,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,100,?],f32> %int0_7237 = torch.constant.int 0 %5659 = torch.aten.clone %5658, %int0_7237 : !torch.vtensor<[4,32,100,?],f32>, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int128_7238 = torch.constant.int 128 %int100_7239 = torch.constant.int 100 %5660 = torch.prim.ListConstruct %int128_7238, %int100_7239, %5656 : 
(!torch.int, !torch.int, !torch.int) -> !torch.list %5661 = torch.aten._unsafe_view %5659, %5660 : !torch.vtensor<[4,32,100,?],f32>, !torch.list -> !torch.vtensor<[128,100,?],f32> %5662 = torch.aten.bmm %5651, %5661 : !torch.vtensor<[128,1,100],f32>, !torch.vtensor<[128,100,?],f32> -> !torch.vtensor<[128,1,?],f32> %int4_7240 = torch.constant.int 4 %int32_7241 = torch.constant.int 32 %int1_7242 = torch.constant.int 1 %5663 = torch.prim.ListConstruct %int4_7240, %int32_7241, %int1_7242, %5656 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5664 = torch.aten.view %5662, %5663 : !torch.vtensor<[128,1,?],f32>, !torch.list -> !torch.vtensor<[4,32,1,?],f32> %float1.000000e01_7243 = torch.constant.float 1.000000e+01 %5665 = torch.aten.div.Scalar %5664, %float1.000000e01_7243 : !torch.vtensor<[4,32,1,?],f32>, !torch.float -> !torch.vtensor<[4,32,1,?],f32> %int1_7244 = torch.constant.int 1 %5666 = torch.aten.add.Tensor %5665, %895, %int1_7244 : !torch.vtensor<[4,32,1,?],f32>, !torch.vtensor<[4,1,1,?],f32>, !torch.int -> !torch.vtensor<[4,32,1,?],f32> %int-1_7245 = torch.constant.int -1 %false_7246 = torch.constant.bool false %5667 = torch.aten._softmax %5666, %int-1_7245, %false_7246 : !torch.vtensor<[4,32,1,?],f32>, !torch.int, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int4_7247 = torch.constant.int 4 %int32_7248 = torch.constant.int 32 %int1_7249 = torch.constant.int 1 %5668 = torch.prim.ListConstruct %int4_7247, %int32_7248, %int1_7249, %5656 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_7250 = torch.constant.bool false %5669 = torch.aten.expand %5667, %5668, %false_7250 : !torch.vtensor<[4,32,1,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int128_7251 = torch.constant.int 128 %int1_7252 = torch.constant.int 1 %5670 = torch.prim.ListConstruct %int128_7251, %int1_7252, %5656 : (!torch.int, !torch.int, !torch.int) -> !torch.list %5671 = torch.aten.view %5669, %5670 : !torch.vtensor<[4,32,1,?],f32>, 
!torch.list -> !torch.vtensor<[128,1,?],f32> %int0_7253 = torch.constant.int 0 %int0_7254 = torch.constant.int 0 %int9223372036854775807_7255 = torch.constant.int 9223372036854775807 %int1_7256 = torch.constant.int 1 %5672 = torch.aten.slice.Tensor %5642, %int0_7253, %int0_7254, %int9223372036854775807_7255, %int1_7256 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_7257 = torch.constant.int 1 %int0_7258 = torch.constant.int 0 %int1_7259 = torch.constant.int 1 %5673 = torch.aten.slice.Tensor %5672, %int1_7257, %int0_7258, %5620, %int1_7259 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_7260 = torch.constant.int 1 %int2_7261 = torch.constant.int 2 %5674 = torch.aten.transpose.int %5673, %int1_7260, %int2_7261 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int1_7262 = torch.constant.int 1 %5675 = torch.aten.size.int %5646, %int1_7262 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_7263 = torch.constant.int 4 %int32_7264 = torch.constant.int 32 %int100_7265 = torch.constant.int 100 %5676 = torch.prim.ListConstruct %int4_7263, %int32_7264, %5675, %int100_7265 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_7266 = torch.constant.bool false %5677 = torch.aten.expand %5674, %5676, %false_7266 : !torch.vtensor<[4,32,?,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,?,100],f32> %int0_7267 = torch.constant.int 0 %5678 = torch.aten.clone %5677, %int0_7267 : !torch.vtensor<[4,32,?,100],f32>, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int128_7268 = torch.constant.int 128 %int100_7269 = torch.constant.int 100 %5679 = torch.prim.ListConstruct %int128_7268, %5675, %int100_7269 : (!torch.int, !torch.int, !torch.int) -> !torch.list %5680 = torch.aten._unsafe_view %5678, %5679 : !torch.vtensor<[4,32,?,100],f32>, 
!torch.list -> !torch.vtensor<[128,?,100],f32> %5681 = torch.aten.bmm %5671, %5680 : !torch.vtensor<[128,1,?],f32>, !torch.vtensor<[128,?,100],f32> -> !torch.vtensor<[128,1,100],f32> %int4_7270 = torch.constant.int 4 %int32_7271 = torch.constant.int 32 %int1_7272 = torch.constant.int 1 %int100_7273 = torch.constant.int 100 %5682 = torch.prim.ListConstruct %int4_7270, %int32_7271, %int1_7272, %int100_7273 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5683 = torch.aten.view %5681, %5682 : !torch.vtensor<[128,1,100],f32>, !torch.list -> !torch.vtensor<[4,32,1,100],f32> %int1_7274 = torch.constant.int 1 %int2_7275 = torch.constant.int 2 %5684 = torch.aten.transpose.int %5683, %int1_7274, %int2_7275 : !torch.vtensor<[4,32,1,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,1,32,100],f32> %int4_7276 = torch.constant.int 4 %int1_7277 = torch.constant.int 1 %int-1_7278 = torch.constant.int -1 %5685 = torch.prim.ListConstruct %int4_7276, %int1_7277, %int-1_7278 : (!torch.int, !torch.int, !torch.int) -> !torch.list %5686 = torch.aten.view %5684, %5685 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,3200],f32> %5687 = torch_c.to_builtin_tensor %5686 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_7279 = tensor.cast %5687 : tensor<4x1x3200xf32> to tensor %5688 = torch_c.to_builtin_tensor %168 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %5689 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_7279, %5688) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_7280 = tensor.cast %5689 : tensor to tensor<4x1x3200xf32> %5690 = torch_c.from_builtin_tensor %cast_7280 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int1_7281 = torch.constant.int 1 %5691 = torch.aten.add.Tensor %5448, %5690, %int1_7281 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_7282 = torch.constant.int 2 %5692 = torch.aten.pow.Tensor_Scalar %5691, 
%int2_7282 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_7283 = torch.constant.int -1 %5693 = torch.prim.ListConstruct %int-1_7283 : (!torch.int) -> !torch.list %true_7284 = torch.constant.bool true %none_7285 = torch.constant.none %5694 = torch.aten.mean.dim %5692, %5693, %true_7284, %none_7285 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_7286 = torch.constant.float 9.9999999747524271E-7 %int1_7287 = torch.constant.int 1 %5695 = torch.aten.add.Scalar %5694, %float9.999990e-07_7286, %int1_7287 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %5696 = torch.aten.rsqrt %5695 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %5697 = torch.aten.mul.Tensor %5691, %5696 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %5698 = torch.aten.mul.Tensor %5697, %169 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %5699 = torch_c.to_builtin_tensor %5698 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_7288 = tensor.cast %5699 : tensor<4x1x3200xf32> to tensor %5700 = torch_c.to_builtin_tensor %170 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %5701 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_7288, %5700) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_7289 = tensor.cast %5701 : tensor to tensor<4x1x8640xf32> %5702 = torch_c.from_builtin_tensor %cast_7289 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %5703 = torch.aten.silu %5702 : !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32> %5704 = torch_c.to_builtin_tensor %5698 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_7290 = tensor.cast %5704 : tensor<4x1x3200xf32> to tensor %5705 = torch_c.to_builtin_tensor %171 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %5706 = util.call 
@sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_7290, %5705) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_7291 = tensor.cast %5706 : tensor to tensor<4x1x8640xf32> %5707 = torch_c.from_builtin_tensor %cast_7291 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %5708 = torch.aten.mul.Tensor %5703, %5707 : !torch.vtensor<[4,1,8640],f32>, !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32> %5709 = torch_c.to_builtin_tensor %5708 : !torch.vtensor<[4,1,8640],f32> -> tensor<4x1x8640xf32> %cast_7292 = tensor.cast %5709 : tensor<4x1x8640xf32> to tensor %5710 = torch_c.to_builtin_tensor %172 : !torch.vtensor<[3200,8640],f16> -> tensor<3200x8640xf16> %5711 = util.call @sharktank_mmtfp_3d_3200_8640_f32f16f32(%cast_7292, %5710) : (tensor, tensor<3200x8640xf16>) -> tensor %cast_7293 = tensor.cast %5711 : tensor to tensor<4x1x3200xf32> %5712 = torch_c.from_builtin_tensor %cast_7293 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int1_7294 = torch.constant.int 1 %5713 = torch.aten.add.Tensor %5691, %5712, %int1_7294 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_7295 = torch.constant.int 2 %5714 = torch.aten.pow.Tensor_Scalar %5713, %int2_7295 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_7296 = torch.constant.int -1 %5715 = torch.prim.ListConstruct %int-1_7296 : (!torch.int) -> !torch.list %true_7297 = torch.constant.bool true %none_7298 = torch.constant.none %5716 = torch.aten.mean.dim %5714, %5715, %true_7297, %none_7298 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_7299 = torch.constant.float 9.9999999747524271E-7 %int1_7300 = torch.constant.int 1 %5717 = torch.aten.add.Scalar %5716, %float9.999990e-07_7299, %int1_7300 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %5718 = torch.aten.rsqrt %5717 : 
!torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %5719 = torch.aten.mul.Tensor %5713, %5718 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %5720 = torch.aten.mul.Tensor %5719, %173 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %5721 = torch_c.to_builtin_tensor %5720 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_7301 = tensor.cast %5721 : tensor<4x1x3200xf32> to tensor %5722 = torch_c.to_builtin_tensor %174 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %5723 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_7301, %5722) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_7302 = tensor.cast %5723 : tensor to tensor<4x1x3200xf32> %5724 = torch_c.from_builtin_tensor %cast_7302 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %5725 = torch_c.to_builtin_tensor %5720 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_7303 = tensor.cast %5725 : tensor<4x1x3200xf32> to tensor %5726 = torch_c.to_builtin_tensor %175 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %5727 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_7303, %5726) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_7304 = tensor.cast %5727 : tensor to tensor<4x1x3200xf32> %5728 = torch_c.from_builtin_tensor %cast_7304 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %5729 = torch_c.to_builtin_tensor %5720 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_7305 = tensor.cast %5729 : tensor<4x1x3200xf32> to tensor %5730 = torch_c.to_builtin_tensor %176 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %5731 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_7305, %5730) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_7306 = tensor.cast %5731 : tensor to tensor<4x1x3200xf32> %5732 = torch_c.from_builtin_tensor %cast_7306 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int4_7307 = 
torch.constant.int 4 %int1_7308 = torch.constant.int 1 %int32_7309 = torch.constant.int 32 %int100_7310 = torch.constant.int 100 %5733 = torch.prim.ListConstruct %int4_7307, %int1_7308, %int32_7309, %int100_7310 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5734 = torch.aten.view %5724, %5733 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_7311 = torch.constant.int 4 %int1_7312 = torch.constant.int 1 %int32_7313 = torch.constant.int 32 %int100_7314 = torch.constant.int 100 %5735 = torch.prim.ListConstruct %int4_7311, %int1_7312, %int32_7313, %int100_7314 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5736 = torch.aten.view %5728, %5735 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_7315 = torch.constant.int 4 %int1_7316 = torch.constant.int 1 %int32_7317 = torch.constant.int 32 %int100_7318 = torch.constant.int 100 %5737 = torch.prim.ListConstruct %int4_7315, %int1_7316, %int32_7317, %int100_7318 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5738 = torch.aten.view %5732, %5737 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_7319 = torch.constant.int 4 %int1_7320 = torch.constant.int 1 %int32_7321 = torch.constant.int 32 %int-1_7322 = torch.constant.int -1 %int2_7323 = torch.constant.int 2 %5739 = torch.prim.ListConstruct %int4_7319, %int1_7320, %int32_7321, %int-1_7322, %int2_7323 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5740 = torch.aten.view %5734, %5739 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %5741 = torch.aten.view_as_complex %5740 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %int4_7324 = torch.constant.int 4 %int1_7325 = torch.constant.int 1 %int32_7326 = torch.constant.int 32 %int-1_7327 = torch.constant.int -1 %int2_7328 = torch.constant.int 2 %5742 = 
torch.prim.ListConstruct %int4_7324, %int1_7325, %int32_7326, %int-1_7327, %int2_7328 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5743 = torch.aten.view %5736, %5742 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %5744 = torch.aten.view_as_complex %5743 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %5745 = torch.aten.mul.Tensor %5741, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %5746 = torch.aten.view_as_real %5745 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_7329 = torch.constant.int 4 %int1_7330 = torch.constant.int 1 %int32_7331 = torch.constant.int 32 %int100_7332 = torch.constant.int 100 %5747 = torch.prim.ListConstruct %int4_7329, %int1_7330, %int32_7331, %int100_7332 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5748 = torch.aten.view %5746, %5747 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %5749 = torch.aten.mul.Tensor %5744, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %5750 = torch.aten.view_as_real %5749 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_7333 = torch.constant.int 4 %int1_7334 = torch.constant.int 1 %int32_7335 = torch.constant.int 32 %int100_7336 = torch.constant.int 100 %5751 = torch.prim.ListConstruct %int4_7333, %int1_7334, %int32_7335, %int100_7336 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5752 = torch.aten.view %5750, %5751 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int1_7337 = torch.constant.int 1 %int1_7338 = torch.constant.int 1 %5753 = torch.aten.add.Scalar %arg2, %int1_7337, %int1_7338 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[4],si64> %int0_7339 = 
torch.constant.int 0 %int0_7340 = torch.constant.int 0 %5754 = torch.aten.select.int %5753, %int0_7339, %int0_7340 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_7341 = torch.constant.int 0 %int0_7342 = torch.constant.int 0 %5755 = torch.aten.select.int %arg3, %int0_7341, %int0_7342 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_7343 = torch.constant.int 0 %int0_7344 = torch.constant.int 0 %int9223372036854775807_7345 = torch.constant.int 9223372036854775807 %int1_7346 = torch.constant.int 1 %5756 = torch.aten.slice.Tensor %5755, %int0_7343, %int0_7344, %int9223372036854775807_7345, %int1_7346 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_7347 = torch.constant.int 16 %5757 = torch.aten.floor_divide.Scalar %5754, %int16_7347 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_7348 = torch.constant.int 0 %5758 = torch.aten.index_select %5756, %int0_7348, %5757 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_7349 = torch.constant.int 16 %5759 = torch.aten.remainder.Scalar %5754, %int16_7349 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_7350 = torch.constant.none %5760 = torch.aten.clone %542, %none_7350 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_7351 = torch.constant.none %5761 = torch.aten.clone %543, %none_7351 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_7352 = torch.constant.int 0 %5762 = torch.aten.unsqueeze %5759, %int0_7352 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_7353 = torch.constant.int 0 %int0_7354 = torch.constant.int 0 %5763 = torch.aten.select.int %5752, %int0_7353, %int0_7354 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_7355 = torch.constant.int 0 %int0_7356 = torch.constant.int 
0 %5764 = torch.aten.select.int %5763, %int0_7355, %int0_7356 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %int-1_7357 = torch.constant.int -1 %int26_7358 = torch.constant.int 26 %int2_7359 = torch.constant.int 2 %int16_7360 = torch.constant.int 16 %int32_7361 = torch.constant.int 32 %int100_7362 = torch.constant.int 100 %5765 = torch.prim.ListConstruct %int-1_7357, %int26_7358, %int2_7359, %int16_7360, %int32_7361, %int100_7362 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5766 = torch.aten.view %5600, %5765 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %5767 = torch.prim.ListConstruct %5758, %5760, %5761, %5762 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_7363 = torch.constant.bool false %5768 = torch.aten.index_put %5766, %5767, %5764, %false_7363 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_7364 = torch.constant.int 2662400 %5769 = torch.prim.ListConstruct %731, %int2662400_7364 : (!torch.int, !torch.int) -> !torch.list %5770 = torch.aten.view %5768, %5769 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_7365 = torch.constant.int -1 %int26_7366 = torch.constant.int 26 %int2_7367 = torch.constant.int 2 %int16_7368 = torch.constant.int 16 %int32_7369 = torch.constant.int 32 %int100_7370 = torch.constant.int 100 %5771 = torch.prim.ListConstruct %int-1_7365, %int26_7366, %int2_7367, %int16_7368, %int32_7369, %int100_7370 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5772 = torch.aten.view %5770, %5771 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_7371 = torch.constant.none %5773 = torch.aten.clone %544, 
%none_7371 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_7372 = torch.constant.none %5774 = torch.aten.clone %545, %none_7372 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_7373 = torch.constant.int 0 %5775 = torch.aten.unsqueeze %5759, %int0_7373 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_7374 = torch.constant.int 0 %int0_7375 = torch.constant.int 0 %5776 = torch.aten.select.int %5738, %int0_7374, %int0_7375 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_7376 = torch.constant.int 0 %int0_7377 = torch.constant.int 0 %5777 = torch.aten.select.int %5776, %int0_7376, %int0_7377 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %5778 = torch.prim.ListConstruct %5758, %5773, %5774, %5775 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_7378 = torch.constant.bool false %5779 = torch.aten.index_put %5772, %5778, %5777, %false_7378 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_7379 = torch.constant.int 2662400 %5780 = torch.prim.ListConstruct %731, %int2662400_7379 : (!torch.int, !torch.int) -> !torch.list %5781 = torch.aten.view %5779, %5780 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_7380 = torch.constant.int -1 %int26_7381 = torch.constant.int 26 %int2_7382 = torch.constant.int 2 %int16_7383 = torch.constant.int 16 %int32_7384 = torch.constant.int 32 %int100_7385 = torch.constant.int 100 %5782 = torch.prim.ListConstruct %int-1_7380, %int26_7381, %int2_7382, %int16_7383, %int32_7384, %int100_7385 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5783 = torch.aten.view %5781, %5782 : !torch.vtensor<[?,2662400],f32>, 
!torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_7386 = torch.constant.int 0 %int1_7387 = torch.constant.int 1 %5784 = torch.aten.select.int %5753, %int0_7386, %int1_7387 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_7388 = torch.constant.int 0 %int1_7389 = torch.constant.int 1 %5785 = torch.aten.select.int %arg3, %int0_7388, %int1_7389 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_7390 = torch.constant.int 0 %int0_7391 = torch.constant.int 0 %int9223372036854775807_7392 = torch.constant.int 9223372036854775807 %int1_7393 = torch.constant.int 1 %5786 = torch.aten.slice.Tensor %5785, %int0_7390, %int0_7391, %int9223372036854775807_7392, %int1_7393 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_7394 = torch.constant.int 16 %5787 = torch.aten.floor_divide.Scalar %5784, %int16_7394 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_7395 = torch.constant.int 0 %5788 = torch.aten.index_select %5786, %int0_7395, %5787 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_7396 = torch.constant.int 16 %5789 = torch.aten.remainder.Scalar %5784, %int16_7396 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_7397 = torch.constant.none %5790 = torch.aten.clone %546, %none_7397 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_7398 = torch.constant.none %5791 = torch.aten.clone %547, %none_7398 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_7399 = torch.constant.int 0 %5792 = torch.aten.unsqueeze %5789, %int0_7399 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_7400 = torch.constant.int 0 %int1_7401 = torch.constant.int 1 %5793 = torch.aten.select.int %5752, %int0_7400, %int1_7401 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> 
%int0_7402 = torch.constant.int 0 %int0_7403 = torch.constant.int 0 %5794 = torch.aten.select.int %5793, %int0_7402, %int0_7403 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %5795 = torch.prim.ListConstruct %5788, %5790, %5791, %5792 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_7404 = torch.constant.bool false %5796 = torch.aten.index_put %5783, %5795, %5794, %false_7404 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_7405 = torch.constant.int 2662400 %5797 = torch.prim.ListConstruct %731, %int2662400_7405 : (!torch.int, !torch.int) -> !torch.list %5798 = torch.aten.view %5796, %5797 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_7406 = torch.constant.int -1 %int26_7407 = torch.constant.int 26 %int2_7408 = torch.constant.int 2 %int16_7409 = torch.constant.int 16 %int32_7410 = torch.constant.int 32 %int100_7411 = torch.constant.int 100 %5799 = torch.prim.ListConstruct %int-1_7406, %int26_7407, %int2_7408, %int16_7409, %int32_7410, %int100_7411 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5800 = torch.aten.view %5798, %5799 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_7412 = torch.constant.none %5801 = torch.aten.clone %548, %none_7412 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_7413 = torch.constant.none %5802 = torch.aten.clone %549, %none_7413 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_7414 = torch.constant.int 0 %5803 = torch.aten.unsqueeze %5789, %int0_7414 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_7415 = torch.constant.int 0 %int1_7416 = torch.constant.int 1 %5804 = torch.aten.select.int %5738, 
%int0_7415, %int1_7416 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_7417 = torch.constant.int 0 %int0_7418 = torch.constant.int 0 %5805 = torch.aten.select.int %5804, %int0_7417, %int0_7418 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %5806 = torch.prim.ListConstruct %5788, %5801, %5802, %5803 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_7419 = torch.constant.bool false %5807 = torch.aten.index_put %5800, %5806, %5805, %false_7419 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_7420 = torch.constant.int 2662400 %5808 = torch.prim.ListConstruct %731, %int2662400_7420 : (!torch.int, !torch.int) -> !torch.list %5809 = torch.aten.view %5807, %5808 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_7421 = torch.constant.int -1 %int26_7422 = torch.constant.int 26 %int2_7423 = torch.constant.int 2 %int16_7424 = torch.constant.int 16 %int32_7425 = torch.constant.int 32 %int100_7426 = torch.constant.int 100 %5810 = torch.prim.ListConstruct %int-1_7421, %int26_7422, %int2_7423, %int16_7424, %int32_7425, %int100_7426 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5811 = torch.aten.view %5809, %5810 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_7427 = torch.constant.int 0 %int2_7428 = torch.constant.int 2 %5812 = torch.aten.select.int %5753, %int0_7427, %int2_7428 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_7429 = torch.constant.int 0 %int2_7430 = torch.constant.int 2 %5813 = torch.aten.select.int %arg3, %int0_7429, %int2_7430 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_7431 = 
torch.constant.int 0 %int0_7432 = torch.constant.int 0 %int9223372036854775807_7433 = torch.constant.int 9223372036854775807 %int1_7434 = torch.constant.int 1 %5814 = torch.aten.slice.Tensor %5813, %int0_7431, %int0_7432, %int9223372036854775807_7433, %int1_7434 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_7435 = torch.constant.int 16 %5815 = torch.aten.floor_divide.Scalar %5812, %int16_7435 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_7436 = torch.constant.int 0 %5816 = torch.aten.index_select %5814, %int0_7436, %5815 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_7437 = torch.constant.int 16 %5817 = torch.aten.remainder.Scalar %5812, %int16_7437 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_7438 = torch.constant.none %5818 = torch.aten.clone %550, %none_7438 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_7439 = torch.constant.none %5819 = torch.aten.clone %551, %none_7439 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_7440 = torch.constant.int 0 %5820 = torch.aten.unsqueeze %5817, %int0_7440 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_7441 = torch.constant.int 0 %int2_7442 = torch.constant.int 2 %5821 = torch.aten.select.int %5752, %int0_7441, %int2_7442 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_7443 = torch.constant.int 0 %int0_7444 = torch.constant.int 0 %5822 = torch.aten.select.int %5821, %int0_7443, %int0_7444 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %5823 = torch.prim.ListConstruct %5816, %5818, %5819, %5820 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_7445 = torch.constant.bool false %5824 = torch.aten.index_put %5811, 
%5823, %5822, %false_7445 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_7446 = torch.constant.int 2662400 %5825 = torch.prim.ListConstruct %731, %int2662400_7446 : (!torch.int, !torch.int) -> !torch.list %5826 = torch.aten.view %5824, %5825 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_7447 = torch.constant.int -1 %int26_7448 = torch.constant.int 26 %int2_7449 = torch.constant.int 2 %int16_7450 = torch.constant.int 16 %int32_7451 = torch.constant.int 32 %int100_7452 = torch.constant.int 100 %5827 = torch.prim.ListConstruct %int-1_7447, %int26_7448, %int2_7449, %int16_7450, %int32_7451, %int100_7452 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5828 = torch.aten.view %5826, %5827 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_7453 = torch.constant.none %5829 = torch.aten.clone %552, %none_7453 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_7454 = torch.constant.none %5830 = torch.aten.clone %553, %none_7454 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_7455 = torch.constant.int 0 %5831 = torch.aten.unsqueeze %5817, %int0_7455 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_7456 = torch.constant.int 0 %int2_7457 = torch.constant.int 2 %5832 = torch.aten.select.int %5738, %int0_7456, %int2_7457 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_7458 = torch.constant.int 0 %int0_7459 = torch.constant.int 0 %5833 = torch.aten.select.int %5832, %int0_7458, %int0_7459 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %5834 = torch.prim.ListConstruct %5816, %5829, %5830, %5831 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, 
!torch.vtensor<[1],si64>) -> !torch.list> %false_7460 = torch.constant.bool false %5835 = torch.aten.index_put %5828, %5834, %5833, %false_7460 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_7461 = torch.constant.int 2662400 %5836 = torch.prim.ListConstruct %731, %int2662400_7461 : (!torch.int, !torch.int) -> !torch.list %5837 = torch.aten.view %5835, %5836 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_7462 = torch.constant.int -1 %int26_7463 = torch.constant.int 26 %int2_7464 = torch.constant.int 2 %int16_7465 = torch.constant.int 16 %int32_7466 = torch.constant.int 32 %int100_7467 = torch.constant.int 100 %5838 = torch.prim.ListConstruct %int-1_7462, %int26_7463, %int2_7464, %int16_7465, %int32_7466, %int100_7467 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5839 = torch.aten.view %5837, %5838 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_7468 = torch.constant.int 0 %int3_7469 = torch.constant.int 3 %5840 = torch.aten.select.int %5753, %int0_7468, %int3_7469 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_7470 = torch.constant.int 0 %int3_7471 = torch.constant.int 3 %5841 = torch.aten.select.int %arg3, %int0_7470, %int3_7471 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_7472 = torch.constant.int 0 %int0_7473 = torch.constant.int 0 %int9223372036854775807_7474 = torch.constant.int 9223372036854775807 %int1_7475 = torch.constant.int 1 %5842 = torch.aten.slice.Tensor %5841, %int0_7472, %int0_7473, %int9223372036854775807_7474, %int1_7475 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_7476 = torch.constant.int 16 %5843 = torch.aten.floor_divide.Scalar %5840, %int16_7476 : 
!torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_7477 = torch.constant.int 0 %5844 = torch.aten.index_select %5842, %int0_7477, %5843 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_7478 = torch.constant.int 16 %5845 = torch.aten.remainder.Scalar %5840, %int16_7478 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_7479 = torch.constant.none %5846 = torch.aten.clone %554, %none_7479 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_7480 = torch.constant.none %5847 = torch.aten.clone %555, %none_7480 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_7481 = torch.constant.int 0 %5848 = torch.aten.unsqueeze %5845, %int0_7481 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_7482 = torch.constant.int 0 %int3_7483 = torch.constant.int 3 %5849 = torch.aten.select.int %5752, %int0_7482, %int3_7483 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_7484 = torch.constant.int 0 %int0_7485 = torch.constant.int 0 %5850 = torch.aten.select.int %5849, %int0_7484, %int0_7485 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %5851 = torch.prim.ListConstruct %5844, %5846, %5847, %5848 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_7486 = torch.constant.bool false %5852 = torch.aten.index_put %5839, %5851, %5850, %false_7486 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_7487 = torch.constant.int 2662400 %5853 = torch.prim.ListConstruct %731, %int2662400_7487 : (!torch.int, !torch.int) -> !torch.list %5854 = torch.aten.view %5852, %5853 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_7488 = 
torch.constant.int -1 %int26_7489 = torch.constant.int 26 %int2_7490 = torch.constant.int 2 %int16_7491 = torch.constant.int 16 %int32_7492 = torch.constant.int 32 %int100_7493 = torch.constant.int 100 %5855 = torch.prim.ListConstruct %int-1_7488, %int26_7489, %int2_7490, %int16_7491, %int32_7492, %int100_7493 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5856 = torch.aten.view %5854, %5855 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_7494 = torch.constant.none %5857 = torch.aten.clone %556, %none_7494 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_7495 = torch.constant.none %5858 = torch.aten.clone %557, %none_7495 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_7496 = torch.constant.int 0 %5859 = torch.aten.unsqueeze %5845, %int0_7496 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_7497 = torch.constant.int 0 %int3_7498 = torch.constant.int 3 %5860 = torch.aten.select.int %5738, %int0_7497, %int3_7498 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_7499 = torch.constant.int 0 %int0_7500 = torch.constant.int 0 %5861 = torch.aten.select.int %5860, %int0_7499, %int0_7500 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %5862 = torch.prim.ListConstruct %5844, %5857, %5858, %5859 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_7501 = torch.constant.bool false %5863 = torch.aten.index_put %5856, %5862, %5861, %false_7501 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_7502 = torch.constant.int 2662400 %5864 = torch.prim.ListConstruct %731, %int2662400_7502 : (!torch.int, !torch.int) -> !torch.list %5865 = torch.aten.view %5863, 
%5864 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int52_7503 = torch.constant.int 52 %5866 = torch.aten.mul.Scalar %arg3, %int52_7503 : !torch.vtensor<[4,?],si64>, !torch.int -> !torch.vtensor<[4,?],si64> %int38 = torch.constant.int 38 %int1_7504 = torch.constant.int 1 %5867 = torch.aten.add.Scalar %5866, %int38, %int1_7504 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_7505 = torch.constant.int 4 %5868 = torch.aten.mul.int %int4_7505, %655 : !torch.int, !torch.int -> !torch.int %5869 = torch.prim.ListConstruct %5868 : (!torch.int) -> !torch.list %5870 = torch.aten.view %5867, %5869 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int-1_7506 = torch.constant.int -1 %int26_7507 = torch.constant.int 26 %int2_7508 = torch.constant.int 2 %int16_7509 = torch.constant.int 16 %int32_7510 = torch.constant.int 32 %int100_7511 = torch.constant.int 100 %5871 = torch.prim.ListConstruct %int-1_7506, %int26_7507, %int2_7508, %int16_7509, %int32_7510, %int100_7511 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5872 = torch.aten.view %5865, %5871 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int26_7512 = torch.constant.int 26 %5873 = torch.aten.mul.int %731, %int26_7512 : !torch.int, !torch.int -> !torch.int %int2_7513 = torch.constant.int 2 %5874 = torch.aten.mul.int %5873, %int2_7513 : !torch.int, !torch.int -> !torch.int %int16_7514 = torch.constant.int 16 %int32_7515 = torch.constant.int 32 %int100_7516 = torch.constant.int 100 %5875 = torch.prim.ListConstruct %5874, %int16_7514, %int32_7515, %int100_7516 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5876 = torch.aten.view %5872, %5875 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,16,32,100],f32> %int0_7517 = torch.constant.int 0 %5877 = torch.aten.index_select %5876, %int0_7517, 
%5870 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_7518 = torch.constant.int 4 %int16_7519 = torch.constant.int 16 %int32_7520 = torch.constant.int 32 %int100_7521 = torch.constant.int 100 %5878 = torch.prim.ListConstruct %int4_7518, %655, %int16_7519, %int32_7520, %int100_7521 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5879 = torch.aten.view %5877, %5878 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_7522 = torch.constant.int 1 %5880 = torch.aten.size.int %5879, %int1_7522 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_7523 = torch.constant.int 16 %5881 = torch.aten.mul.int %5880, %int16_7523 : !torch.int, !torch.int -> !torch.int %int4_7524 = torch.constant.int 4 %int32_7525 = torch.constant.int 32 %int100_7526 = torch.constant.int 100 %5882 = torch.prim.ListConstruct %int4_7524, %5881, %int32_7525, %int100_7526 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5883 = torch.aten.view %5879, %5882 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_7527 = torch.constant.int 0 %int0_7528 = torch.constant.int 0 %int9223372036854775807_7529 = torch.constant.int 9223372036854775807 %int1_7530 = torch.constant.int 1 %5884 = torch.aten.slice.Tensor %5625, %int0_7527, %int0_7528, %int9223372036854775807_7529, %int1_7530 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int16_7531 = torch.constant.int 16 %5885 = torch.aten.mul.int %655, %int16_7531 : !torch.int, !torch.int -> !torch.int %int1_7532 = torch.constant.int 1 %int0_7533 = torch.constant.int 0 %int1_7534 = torch.constant.int 1 %5886 = torch.aten.slice.Tensor %5884, %int1_7532, %int0_7533, %5885, %int1_7534 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> 
!torch.vtensor<[4,?,32,100],f32> %false_7535 = torch.constant.bool false %5887 = torch.aten.copy %5886, %5883, %false_7535 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_7536 = torch.constant.int 0 %int0_7537 = torch.constant.int 0 %int9223372036854775807_7538 = torch.constant.int 9223372036854775807 %int1_7539 = torch.constant.int 1 %5888 = torch.aten.slice.Tensor %5625, %int0_7536, %int0_7537, %int9223372036854775807_7538, %int1_7539 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_7540 = torch.constant.int 1 %int0_7541 = torch.constant.int 0 %int1_7542 = torch.constant.int 1 %5889 = torch.aten.slice_scatter %5888, %5887, %int1_7540, %int0_7541, %5885, %int1_7542 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_7543 = torch.constant.int 0 %int0_7544 = torch.constant.int 0 %int9223372036854775807_7545 = torch.constant.int 9223372036854775807 %int1_7546 = torch.constant.int 1 %5890 = torch.aten.slice_scatter %5625, %5889, %int0_7543, %int0_7544, %int9223372036854775807_7545, %int1_7546 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_7547 = torch.constant.int 1 %int1_7548 = torch.constant.int 1 %5891 = torch.aten.add.Scalar %5867, %int1_7547, %int1_7548 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_7549 = torch.constant.int 4 %5892 = torch.aten.mul.int %int4_7549, %655 : !torch.int, !torch.int -> !torch.int %5893 = torch.prim.ListConstruct %5892 : (!torch.int) -> !torch.list %5894 = torch.aten.view %5891, %5893 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int0_7550 = torch.constant.int 0 %5895 = 
torch.aten.index_select %5876, %int0_7550, %5894 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_7551 = torch.constant.int 4 %int16_7552 = torch.constant.int 16 %int32_7553 = torch.constant.int 32 %int100_7554 = torch.constant.int 100 %5896 = torch.prim.ListConstruct %int4_7551, %655, %int16_7552, %int32_7553, %int100_7554 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5897 = torch.aten.view %5895, %5896 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_7555 = torch.constant.int 1 %5898 = torch.aten.size.int %5897, %int1_7555 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_7556 = torch.constant.int 16 %5899 = torch.aten.mul.int %5898, %int16_7556 : !torch.int, !torch.int -> !torch.int %int4_7557 = torch.constant.int 4 %int32_7558 = torch.constant.int 32 %int100_7559 = torch.constant.int 100 %5900 = torch.prim.ListConstruct %int4_7557, %5899, %int32_7558, %int100_7559 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5901 = torch.aten.view %5897, %5900 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_7560 = torch.constant.int 0 %int0_7561 = torch.constant.int 0 %int9223372036854775807_7562 = torch.constant.int 9223372036854775807 %int1_7563 = torch.constant.int 1 %5902 = torch.aten.slice.Tensor %5642, %int0_7560, %int0_7561, %int9223372036854775807_7562, %int1_7563 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_7564 = torch.constant.int 1 %int0_7565 = torch.constant.int 0 %int1_7566 = torch.constant.int 1 %5903 = torch.aten.slice.Tensor %5902, %int1_7564, %int0_7565, %5885, %int1_7566 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_7567 = torch.constant.bool false %5904 = 
torch.aten.copy %5903, %5901, %false_7567 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_7568 = torch.constant.int 0 %int0_7569 = torch.constant.int 0 %int9223372036854775807_7570 = torch.constant.int 9223372036854775807 %int1_7571 = torch.constant.int 1 %5905 = torch.aten.slice.Tensor %5642, %int0_7568, %int0_7569, %int9223372036854775807_7570, %int1_7571 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_7572 = torch.constant.int 1 %int0_7573 = torch.constant.int 0 %int1_7574 = torch.constant.int 1 %5906 = torch.aten.slice_scatter %5905, %5904, %int1_7572, %int0_7573, %5885, %int1_7574 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_7575 = torch.constant.int 0 %int0_7576 = torch.constant.int 0 %int9223372036854775807_7577 = torch.constant.int 9223372036854775807 %int1_7578 = torch.constant.int 1 %5907 = torch.aten.slice_scatter %5642, %5906, %int0_7575, %int0_7576, %int9223372036854775807_7577, %int1_7578 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_7579 = torch.constant.int 0 %int0_7580 = torch.constant.int 0 %int9223372036854775807_7581 = torch.constant.int 9223372036854775807 %int1_7582 = torch.constant.int 1 %5908 = torch.aten.slice.Tensor %671, %int0_7579, %int0_7580, %int9223372036854775807_7581, %int1_7582 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_7583 = torch.constant.int 1 %int0_7584 = torch.constant.int 0 %int1_7585 = torch.constant.int 1 %5909 = torch.aten.slice.Tensor %5908, %int1_7583, %int0_7584, %5885, %int1_7585 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, 
!torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int0_7586 = torch.constant.int 0 %int0_7587 = torch.constant.int 0 %int9223372036854775807_7588 = torch.constant.int 9223372036854775807 %int1_7589 = torch.constant.int 1 %5910 = torch.aten.slice.Tensor %673, %int0_7586, %int0_7587, %int9223372036854775807_7588, %int1_7589 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_7590 = torch.constant.int 1 %int0_7591 = torch.constant.int 0 %int1_7592 = torch.constant.int 1 %5911 = torch.aten.slice.Tensor %5910, %int1_7590, %int0_7591, %5885, %int1_7592 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_7593 = torch.constant.int 1 %int2_7594 = torch.constant.int 2 %5912 = torch.aten.transpose.int %5748, %int1_7593, %int2_7594 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,1,100],f32> %int4_7595 = torch.constant.int 4 %int32_7596 = torch.constant.int 32 %int1_7597 = torch.constant.int 1 %int100_7598 = torch.constant.int 100 %5913 = torch.prim.ListConstruct %int4_7595, %int32_7596, %int1_7597, %int100_7598 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_7599 = torch.constant.bool false %5914 = torch.aten.expand %5912, %5913, %false_7599 : !torch.vtensor<[4,32,1,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,100],f32> %int128_7600 = torch.constant.int 128 %int1_7601 = torch.constant.int 1 %int100_7602 = torch.constant.int 100 %5915 = torch.prim.ListConstruct %int128_7600, %int1_7601, %int100_7602 : (!torch.int, !torch.int, !torch.int) -> !torch.list %5916 = torch.aten.view %5914, %5915 : !torch.vtensor<[4,32,1,100],f32>, !torch.list -> !torch.vtensor<[128,1,100],f32> %int0_7603 = torch.constant.int 0 %int0_7604 = torch.constant.int 0 %int9223372036854775807_7605 = torch.constant.int 9223372036854775807 %int1_7606 = 
torch.constant.int 1 %5917 = torch.aten.slice.Tensor %5890, %int0_7603, %int0_7604, %int9223372036854775807_7605, %int1_7606 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_7607 = torch.constant.int 1 %int0_7608 = torch.constant.int 0 %int1_7609 = torch.constant.int 1 %5918 = torch.aten.slice.Tensor %5917, %int1_7607, %int0_7608, %5885, %int1_7609 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_7610 = torch.constant.int 1 %int2_7611 = torch.constant.int 2 %5919 = torch.aten.transpose.int %5918, %int1_7610, %int2_7611 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int2_7612 = torch.constant.int 2 %int3_7613 = torch.constant.int 3 %5920 = torch.aten.transpose.int %5919, %int2_7612, %int3_7613 : !torch.vtensor<[4,32,?,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int1_7614 = torch.constant.int 1 %5921 = torch.aten.size.int %5909, %int1_7614 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_7615 = torch.constant.int 4 %int32_7616 = torch.constant.int 32 %int100_7617 = torch.constant.int 100 %5922 = torch.prim.ListConstruct %int4_7615, %int32_7616, %int100_7617, %5921 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_7618 = torch.constant.bool false %5923 = torch.aten.expand %5920, %5922, %false_7618 : !torch.vtensor<[4,32,100,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,100,?],f32> %int0_7619 = torch.constant.int 0 %5924 = torch.aten.clone %5923, %int0_7619 : !torch.vtensor<[4,32,100,?],f32>, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int128_7620 = torch.constant.int 128 %int100_7621 = torch.constant.int 100 %5925 = torch.prim.ListConstruct %int128_7620, %int100_7621, %5921 : (!torch.int, !torch.int, !torch.int) -> !torch.list %5926 = torch.aten._unsafe_view %5924, %5925 : 
!torch.vtensor<[4,32,100,?],f32>, !torch.list -> !torch.vtensor<[128,100,?],f32> %5927 = torch.aten.bmm %5916, %5926 : !torch.vtensor<[128,1,100],f32>, !torch.vtensor<[128,100,?],f32> -> !torch.vtensor<[128,1,?],f32> %int4_7622 = torch.constant.int 4 %int32_7623 = torch.constant.int 32 %int1_7624 = torch.constant.int 1 %5928 = torch.prim.ListConstruct %int4_7622, %int32_7623, %int1_7624, %5921 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5929 = torch.aten.view %5927, %5928 : !torch.vtensor<[128,1,?],f32>, !torch.list -> !torch.vtensor<[4,32,1,?],f32> %float1.000000e01_7625 = torch.constant.float 1.000000e+01 %5930 = torch.aten.div.Scalar %5929, %float1.000000e01_7625 : !torch.vtensor<[4,32,1,?],f32>, !torch.float -> !torch.vtensor<[4,32,1,?],f32> %int1_7626 = torch.constant.int 1 %5931 = torch.aten.add.Tensor %5930, %895, %int1_7626 : !torch.vtensor<[4,32,1,?],f32>, !torch.vtensor<[4,1,1,?],f32>, !torch.int -> !torch.vtensor<[4,32,1,?],f32> %int-1_7627 = torch.constant.int -1 %false_7628 = torch.constant.bool false %5932 = torch.aten._softmax %5931, %int-1_7627, %false_7628 : !torch.vtensor<[4,32,1,?],f32>, !torch.int, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int4_7629 = torch.constant.int 4 %int32_7630 = torch.constant.int 32 %int1_7631 = torch.constant.int 1 %5933 = torch.prim.ListConstruct %int4_7629, %int32_7630, %int1_7631, %5921 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_7632 = torch.constant.bool false %5934 = torch.aten.expand %5932, %5933, %false_7632 : !torch.vtensor<[4,32,1,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int128_7633 = torch.constant.int 128 %int1_7634 = torch.constant.int 1 %5935 = torch.prim.ListConstruct %int128_7633, %int1_7634, %5921 : (!torch.int, !torch.int, !torch.int) -> !torch.list %5936 = torch.aten.view %5934, %5935 : !torch.vtensor<[4,32,1,?],f32>, !torch.list -> !torch.vtensor<[128,1,?],f32> %int0_7635 = torch.constant.int 0 %int0_7636 = 
torch.constant.int 0 %int9223372036854775807_7637 = torch.constant.int 9223372036854775807 %int1_7638 = torch.constant.int 1 %5937 = torch.aten.slice.Tensor %5907, %int0_7635, %int0_7636, %int9223372036854775807_7637, %int1_7638 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_7639 = torch.constant.int 1 %int0_7640 = torch.constant.int 0 %int1_7641 = torch.constant.int 1 %5938 = torch.aten.slice.Tensor %5937, %int1_7639, %int0_7640, %5885, %int1_7641 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_7642 = torch.constant.int 1 %int2_7643 = torch.constant.int 2 %5939 = torch.aten.transpose.int %5938, %int1_7642, %int2_7643 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int1_7644 = torch.constant.int 1 %5940 = torch.aten.size.int %5911, %int1_7644 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_7645 = torch.constant.int 4 %int32_7646 = torch.constant.int 32 %int100_7647 = torch.constant.int 100 %5941 = torch.prim.ListConstruct %int4_7645, %int32_7646, %5940, %int100_7647 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_7648 = torch.constant.bool false %5942 = torch.aten.expand %5939, %5941, %false_7648 : !torch.vtensor<[4,32,?,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,?,100],f32> %int0_7649 = torch.constant.int 0 %5943 = torch.aten.clone %5942, %int0_7649 : !torch.vtensor<[4,32,?,100],f32>, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int128_7650 = torch.constant.int 128 %int100_7651 = torch.constant.int 100 %5944 = torch.prim.ListConstruct %int128_7650, %5940, %int100_7651 : (!torch.int, !torch.int, !torch.int) -> !torch.list %5945 = torch.aten._unsafe_view %5943, %5944 : !torch.vtensor<[4,32,?,100],f32>, !torch.list -> !torch.vtensor<[128,?,100],f32> %5946 = torch.aten.bmm %5936, %5945 : 
!torch.vtensor<[128,1,?],f32>, !torch.vtensor<[128,?,100],f32> -> !torch.vtensor<[128,1,100],f32> %int4_7652 = torch.constant.int 4 %int32_7653 = torch.constant.int 32 %int1_7654 = torch.constant.int 1 %int100_7655 = torch.constant.int 100 %5947 = torch.prim.ListConstruct %int4_7652, %int32_7653, %int1_7654, %int100_7655 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5948 = torch.aten.view %5946, %5947 : !torch.vtensor<[128,1,100],f32>, !torch.list -> !torch.vtensor<[4,32,1,100],f32> %int1_7656 = torch.constant.int 1 %int2_7657 = torch.constant.int 2 %5949 = torch.aten.transpose.int %5948, %int1_7656, %int2_7657 : !torch.vtensor<[4,32,1,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,1,32,100],f32> %int4_7658 = torch.constant.int 4 %int1_7659 = torch.constant.int 1 %int-1_7660 = torch.constant.int -1 %5950 = torch.prim.ListConstruct %int4_7658, %int1_7659, %int-1_7660 : (!torch.int, !torch.int, !torch.int) -> !torch.list %5951 = torch.aten.view %5949, %5950 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,3200],f32> %5952 = torch_c.to_builtin_tensor %5951 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_7661 = tensor.cast %5952 : tensor<4x1x3200xf32> to tensor %5953 = torch_c.to_builtin_tensor %177 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %5954 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_7661, %5953) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_7662 = tensor.cast %5954 : tensor to tensor<4x1x3200xf32> %5955 = torch_c.from_builtin_tensor %cast_7662 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int1_7663 = torch.constant.int 1 %5956 = torch.aten.add.Tensor %5713, %5955, %int1_7663 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_7664 = torch.constant.int 2 %5957 = torch.aten.pow.Tensor_Scalar %5956, %int2_7664 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> 
%int-1_7665 = torch.constant.int -1 %5958 = torch.prim.ListConstruct %int-1_7665 : (!torch.int) -> !torch.list %true_7666 = torch.constant.bool true %none_7667 = torch.constant.none %5959 = torch.aten.mean.dim %5957, %5958, %true_7666, %none_7667 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_7668 = torch.constant.float 9.9999999747524271E-7 %int1_7669 = torch.constant.int 1 %5960 = torch.aten.add.Scalar %5959, %float9.999990e-07_7668, %int1_7669 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %5961 = torch.aten.rsqrt %5960 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %5962 = torch.aten.mul.Tensor %5956, %5961 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %5963 = torch.aten.mul.Tensor %5962, %178 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %5964 = torch_c.to_builtin_tensor %5963 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_7670 = tensor.cast %5964 : tensor<4x1x3200xf32> to tensor %5965 = torch_c.to_builtin_tensor %179 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %5966 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_7670, %5965) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_7671 = tensor.cast %5966 : tensor to tensor<4x1x8640xf32> %5967 = torch_c.from_builtin_tensor %cast_7671 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %5968 = torch.aten.silu %5967 : !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32> %5969 = torch_c.to_builtin_tensor %5963 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_7672 = tensor.cast %5969 : tensor<4x1x3200xf32> to tensor %5970 = torch_c.to_builtin_tensor %180 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %5971 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_7672, %5970) : (tensor, tensor<8640x3200xf16>) -> 
tensor %cast_7673 = tensor.cast %5971 : tensor to tensor<4x1x8640xf32> %5972 = torch_c.from_builtin_tensor %cast_7673 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %5973 = torch.aten.mul.Tensor %5968, %5972 : !torch.vtensor<[4,1,8640],f32>, !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32> %5974 = torch_c.to_builtin_tensor %5973 : !torch.vtensor<[4,1,8640],f32> -> tensor<4x1x8640xf32> %cast_7674 = tensor.cast %5974 : tensor<4x1x8640xf32> to tensor %5975 = torch_c.to_builtin_tensor %181 : !torch.vtensor<[3200,8640],f16> -> tensor<3200x8640xf16> %5976 = util.call @sharktank_mmtfp_3d_3200_8640_f32f16f32(%cast_7674, %5975) : (tensor, tensor<3200x8640xf16>) -> tensor %cast_7675 = tensor.cast %5976 : tensor to tensor<4x1x3200xf32> %5977 = torch_c.from_builtin_tensor %cast_7675 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int1_7676 = torch.constant.int 1 %5978 = torch.aten.add.Tensor %5956, %5977, %int1_7676 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_7677 = torch.constant.int 2 %5979 = torch.aten.pow.Tensor_Scalar %5978, %int2_7677 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_7678 = torch.constant.int -1 %5980 = torch.prim.ListConstruct %int-1_7678 : (!torch.int) -> !torch.list %true_7679 = torch.constant.bool true %none_7680 = torch.constant.none %5981 = torch.aten.mean.dim %5979, %5980, %true_7679, %none_7680 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_7681 = torch.constant.float 9.9999999747524271E-7 %int1_7682 = torch.constant.int 1 %5982 = torch.aten.add.Scalar %5981, %float9.999990e-07_7681, %int1_7682 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %5983 = torch.aten.rsqrt %5982 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %5984 = torch.aten.mul.Tensor %5978, %5983 : 
!torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %5985 = torch.aten.mul.Tensor %5984, %182 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %5986 = torch_c.to_builtin_tensor %5985 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_7683 = tensor.cast %5986 : tensor<4x1x3200xf32> to tensor %5987 = torch_c.to_builtin_tensor %183 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %5988 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_7683, %5987) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_7684 = tensor.cast %5988 : tensor to tensor<4x1x3200xf32> %5989 = torch_c.from_builtin_tensor %cast_7684 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %5990 = torch_c.to_builtin_tensor %5985 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_7685 = tensor.cast %5990 : tensor<4x1x3200xf32> to tensor %5991 = torch_c.to_builtin_tensor %184 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %5992 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_7685, %5991) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_7686 = tensor.cast %5992 : tensor to tensor<4x1x3200xf32> %5993 = torch_c.from_builtin_tensor %cast_7686 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %5994 = torch_c.to_builtin_tensor %5985 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_7687 = tensor.cast %5994 : tensor<4x1x3200xf32> to tensor %5995 = torch_c.to_builtin_tensor %185 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %5996 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_7687, %5995) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_7688 = tensor.cast %5996 : tensor to tensor<4x1x3200xf32> %5997 = torch_c.from_builtin_tensor %cast_7688 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int4_7689 = torch.constant.int 4 %int1_7690 = torch.constant.int 1 %int32_7691 = torch.constant.int 32 %int100_7692 = 
torch.constant.int 100 %5998 = torch.prim.ListConstruct %int4_7689, %int1_7690, %int32_7691, %int100_7692 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %5999 = torch.aten.view %5989, %5998 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_7693 = torch.constant.int 4 %int1_7694 = torch.constant.int 1 %int32_7695 = torch.constant.int 32 %int100_7696 = torch.constant.int 100 %6000 = torch.prim.ListConstruct %int4_7693, %int1_7694, %int32_7695, %int100_7696 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6001 = torch.aten.view %5993, %6000 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_7697 = torch.constant.int 4 %int1_7698 = torch.constant.int 1 %int32_7699 = torch.constant.int 32 %int100_7700 = torch.constant.int 100 %6002 = torch.prim.ListConstruct %int4_7697, %int1_7698, %int32_7699, %int100_7700 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6003 = torch.aten.view %5997, %6002 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_7701 = torch.constant.int 4 %int1_7702 = torch.constant.int 1 %int32_7703 = torch.constant.int 32 %int-1_7704 = torch.constant.int -1 %int2_7705 = torch.constant.int 2 %6004 = torch.prim.ListConstruct %int4_7701, %int1_7702, %int32_7703, %int-1_7704, %int2_7705 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6005 = torch.aten.view %5999, %6004 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %6006 = torch.aten.view_as_complex %6005 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %int4_7706 = torch.constant.int 4 %int1_7707 = torch.constant.int 1 %int32_7708 = torch.constant.int 32 %int-1_7709 = torch.constant.int -1 %int2_7710 = torch.constant.int 2 %6007 = torch.prim.ListConstruct %int4_7706, %int1_7707, %int32_7708, %int-1_7709, %int2_7710 : (!torch.int, !torch.int, 
!torch.int, !torch.int, !torch.int) -> !torch.list %6008 = torch.aten.view %6001, %6007 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %6009 = torch.aten.view_as_complex %6008 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %6010 = torch.aten.mul.Tensor %6006, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %6011 = torch.aten.view_as_real %6010 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_7711 = torch.constant.int 4 %int1_7712 = torch.constant.int 1 %int32_7713 = torch.constant.int 32 %int100_7714 = torch.constant.int 100 %6012 = torch.prim.ListConstruct %int4_7711, %int1_7712, %int32_7713, %int100_7714 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6013 = torch.aten.view %6011, %6012 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %6014 = torch.aten.mul.Tensor %6009, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %6015 = torch.aten.view_as_real %6014 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_7715 = torch.constant.int 4 %int1_7716 = torch.constant.int 1 %int32_7717 = torch.constant.int 32 %int100_7718 = torch.constant.int 100 %6016 = torch.prim.ListConstruct %int4_7715, %int1_7716, %int32_7717, %int100_7718 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6017 = torch.aten.view %6015, %6016 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int1_7719 = torch.constant.int 1 %int1_7720 = torch.constant.int 1 %6018 = torch.aten.add.Scalar %arg2, %int1_7719, %int1_7720 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[4],si64> %int0_7721 = torch.constant.int 0 %int0_7722 = torch.constant.int 0 %6019 = torch.aten.select.int %6018, %int0_7721, %int0_7722 : 
!torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_7723 = torch.constant.int 0 %int0_7724 = torch.constant.int 0 %6020 = torch.aten.select.int %arg3, %int0_7723, %int0_7724 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_7725 = torch.constant.int 0 %int0_7726 = torch.constant.int 0 %int9223372036854775807_7727 = torch.constant.int 9223372036854775807 %int1_7728 = torch.constant.int 1 %6021 = torch.aten.slice.Tensor %6020, %int0_7725, %int0_7726, %int9223372036854775807_7727, %int1_7728 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_7729 = torch.constant.int 16 %6022 = torch.aten.floor_divide.Scalar %6019, %int16_7729 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_7730 = torch.constant.int 0 %6023 = torch.aten.index_select %6021, %int0_7730, %6022 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_7731 = torch.constant.int 16 %6024 = torch.aten.remainder.Scalar %6019, %int16_7731 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_7732 = torch.constant.none %6025 = torch.aten.clone %558, %none_7732 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_7733 = torch.constant.none %6026 = torch.aten.clone %559, %none_7733 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_7734 = torch.constant.int 0 %6027 = torch.aten.unsqueeze %6024, %int0_7734 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_7735 = torch.constant.int 0 %int0_7736 = torch.constant.int 0 %6028 = torch.aten.select.int %6017, %int0_7735, %int0_7736 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_7737 = torch.constant.int 0 %int0_7738 = torch.constant.int 0 %6029 = torch.aten.select.int %6028, %int0_7737, %int0_7738 : !torch.vtensor<[1,32,100],f32>, !torch.int, 
!torch.int -> !torch.vtensor<[32,100],f32> %int-1_7739 = torch.constant.int -1 %int26_7740 = torch.constant.int 26 %int2_7741 = torch.constant.int 2 %int16_7742 = torch.constant.int 16 %int32_7743 = torch.constant.int 32 %int100_7744 = torch.constant.int 100 %6030 = torch.prim.ListConstruct %int-1_7739, %int26_7740, %int2_7741, %int16_7742, %int32_7743, %int100_7744 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6031 = torch.aten.view %5865, %6030 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %6032 = torch.prim.ListConstruct %6023, %6025, %6026, %6027 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_7745 = torch.constant.bool false %6033 = torch.aten.index_put %6031, %6032, %6029, %false_7745 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_7746 = torch.constant.int 2662400 %6034 = torch.prim.ListConstruct %731, %int2662400_7746 : (!torch.int, !torch.int) -> !torch.list %6035 = torch.aten.view %6033, %6034 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_7747 = torch.constant.int -1 %int26_7748 = torch.constant.int 26 %int2_7749 = torch.constant.int 2 %int16_7750 = torch.constant.int 16 %int32_7751 = torch.constant.int 32 %int100_7752 = torch.constant.int 100 %6036 = torch.prim.ListConstruct %int-1_7747, %int26_7748, %int2_7749, %int16_7750, %int32_7751, %int100_7752 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6037 = torch.aten.view %6035, %6036 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_7753 = torch.constant.none %6038 = torch.aten.clone %560, %none_7753 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_7754 = torch.constant.none 
%6039 = torch.aten.clone %561, %none_7754 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_7755 = torch.constant.int 0 %6040 = torch.aten.unsqueeze %6024, %int0_7755 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_7756 = torch.constant.int 0 %int0_7757 = torch.constant.int 0 %6041 = torch.aten.select.int %6003, %int0_7756, %int0_7757 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_7758 = torch.constant.int 0 %int0_7759 = torch.constant.int 0 %6042 = torch.aten.select.int %6041, %int0_7758, %int0_7759 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %6043 = torch.prim.ListConstruct %6023, %6038, %6039, %6040 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_7760 = torch.constant.bool false %6044 = torch.aten.index_put %6037, %6043, %6042, %false_7760 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_7761 = torch.constant.int 2662400 %6045 = torch.prim.ListConstruct %731, %int2662400_7761 : (!torch.int, !torch.int) -> !torch.list %6046 = torch.aten.view %6044, %6045 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_7762 = torch.constant.int -1 %int26_7763 = torch.constant.int 26 %int2_7764 = torch.constant.int 2 %int16_7765 = torch.constant.int 16 %int32_7766 = torch.constant.int 32 %int100_7767 = torch.constant.int 100 %6047 = torch.prim.ListConstruct %int-1_7762, %int26_7763, %int2_7764, %int16_7765, %int32_7766, %int100_7767 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6048 = torch.aten.view %6046, %6047 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_7768 = torch.constant.int 0 %int1_7769 = torch.constant.int 1 
%6049 = torch.aten.select.int %6018, %int0_7768, %int1_7769 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_7770 = torch.constant.int 0 %int1_7771 = torch.constant.int 1 %6050 = torch.aten.select.int %arg3, %int0_7770, %int1_7771 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_7772 = torch.constant.int 0 %int0_7773 = torch.constant.int 0 %int9223372036854775807_7774 = torch.constant.int 9223372036854775807 %int1_7775 = torch.constant.int 1 %6051 = torch.aten.slice.Tensor %6050, %int0_7772, %int0_7773, %int9223372036854775807_7774, %int1_7775 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_7776 = torch.constant.int 16 %6052 = torch.aten.floor_divide.Scalar %6049, %int16_7776 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_7777 = torch.constant.int 0 %6053 = torch.aten.index_select %6051, %int0_7777, %6052 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_7778 = torch.constant.int 16 %6054 = torch.aten.remainder.Scalar %6049, %int16_7778 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_7779 = torch.constant.none %6055 = torch.aten.clone %562, %none_7779 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_7780 = torch.constant.none %6056 = torch.aten.clone %563, %none_7780 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_7781 = torch.constant.int 0 %6057 = torch.aten.unsqueeze %6054, %int0_7781 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_7782 = torch.constant.int 0 %int1_7783 = torch.constant.int 1 %6058 = torch.aten.select.int %6017, %int0_7782, %int1_7783 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_7784 = torch.constant.int 0 %int0_7785 = torch.constant.int 0 %6059 = torch.aten.select.int %6058, %int0_7784, 
%int0_7785 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %6060 = torch.prim.ListConstruct %6053, %6055, %6056, %6057 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_7786 = torch.constant.bool false %6061 = torch.aten.index_put %6048, %6060, %6059, %false_7786 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_7787 = torch.constant.int 2662400 %6062 = torch.prim.ListConstruct %731, %int2662400_7787 : (!torch.int, !torch.int) -> !torch.list %6063 = torch.aten.view %6061, %6062 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_7788 = torch.constant.int -1 %int26_7789 = torch.constant.int 26 %int2_7790 = torch.constant.int 2 %int16_7791 = torch.constant.int 16 %int32_7792 = torch.constant.int 32 %int100_7793 = torch.constant.int 100 %6064 = torch.prim.ListConstruct %int-1_7788, %int26_7789, %int2_7790, %int16_7791, %int32_7792, %int100_7793 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6065 = torch.aten.view %6063, %6064 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_7794 = torch.constant.none %6066 = torch.aten.clone %564, %none_7794 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_7795 = torch.constant.none %6067 = torch.aten.clone %565, %none_7795 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_7796 = torch.constant.int 0 %6068 = torch.aten.unsqueeze %6054, %int0_7796 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_7797 = torch.constant.int 0 %int1_7798 = torch.constant.int 1 %6069 = torch.aten.select.int %6003, %int0_7797, %int1_7798 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> 
%int0_7799 = torch.constant.int 0 %int0_7800 = torch.constant.int 0 %6070 = torch.aten.select.int %6069, %int0_7799, %int0_7800 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %6071 = torch.prim.ListConstruct %6053, %6066, %6067, %6068 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_7801 = torch.constant.bool false %6072 = torch.aten.index_put %6065, %6071, %6070, %false_7801 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_7802 = torch.constant.int 2662400 %6073 = torch.prim.ListConstruct %731, %int2662400_7802 : (!torch.int, !torch.int) -> !torch.list %6074 = torch.aten.view %6072, %6073 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_7803 = torch.constant.int -1 %int26_7804 = torch.constant.int 26 %int2_7805 = torch.constant.int 2 %int16_7806 = torch.constant.int 16 %int32_7807 = torch.constant.int 32 %int100_7808 = torch.constant.int 100 %6075 = torch.prim.ListConstruct %int-1_7803, %int26_7804, %int2_7805, %int16_7806, %int32_7807, %int100_7808 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6076 = torch.aten.view %6074, %6075 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_7809 = torch.constant.int 0 %int2_7810 = torch.constant.int 2 %6077 = torch.aten.select.int %6018, %int0_7809, %int2_7810 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_7811 = torch.constant.int 0 %int2_7812 = torch.constant.int 2 %6078 = torch.aten.select.int %arg3, %int0_7811, %int2_7812 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_7813 = torch.constant.int 0 %int0_7814 = torch.constant.int 0 %int9223372036854775807_7815 = torch.constant.int 
9223372036854775807 %int1_7816 = torch.constant.int 1 %6079 = torch.aten.slice.Tensor %6078, %int0_7813, %int0_7814, %int9223372036854775807_7815, %int1_7816 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_7817 = torch.constant.int 16 %6080 = torch.aten.floor_divide.Scalar %6077, %int16_7817 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_7818 = torch.constant.int 0 %6081 = torch.aten.index_select %6079, %int0_7818, %6080 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_7819 = torch.constant.int 16 %6082 = torch.aten.remainder.Scalar %6077, %int16_7819 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_7820 = torch.constant.none %6083 = torch.aten.clone %566, %none_7820 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_7821 = torch.constant.none %6084 = torch.aten.clone %567, %none_7821 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_7822 = torch.constant.int 0 %6085 = torch.aten.unsqueeze %6082, %int0_7822 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_7823 = torch.constant.int 0 %int2_7824 = torch.constant.int 2 %6086 = torch.aten.select.int %6017, %int0_7823, %int2_7824 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_7825 = torch.constant.int 0 %int0_7826 = torch.constant.int 0 %6087 = torch.aten.select.int %6086, %int0_7825, %int0_7826 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %6088 = torch.prim.ListConstruct %6081, %6083, %6084, %6085 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_7827 = torch.constant.bool false %6089 = torch.aten.index_put %6076, %6088, %6087, %false_7827 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, 
!torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_7828 = torch.constant.int 2662400 %6090 = torch.prim.ListConstruct %731, %int2662400_7828 : (!torch.int, !torch.int) -> !torch.list %6091 = torch.aten.view %6089, %6090 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_7829 = torch.constant.int -1 %int26_7830 = torch.constant.int 26 %int2_7831 = torch.constant.int 2 %int16_7832 = torch.constant.int 16 %int32_7833 = torch.constant.int 32 %int100_7834 = torch.constant.int 100 %6092 = torch.prim.ListConstruct %int-1_7829, %int26_7830, %int2_7831, %int16_7832, %int32_7833, %int100_7834 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6093 = torch.aten.view %6091, %6092 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_7835 = torch.constant.none %6094 = torch.aten.clone %568, %none_7835 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_7836 = torch.constant.none %6095 = torch.aten.clone %569, %none_7836 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_7837 = torch.constant.int 0 %6096 = torch.aten.unsqueeze %6082, %int0_7837 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_7838 = torch.constant.int 0 %int2_7839 = torch.constant.int 2 %6097 = torch.aten.select.int %6003, %int0_7838, %int2_7839 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_7840 = torch.constant.int 0 %int0_7841 = torch.constant.int 0 %6098 = torch.aten.select.int %6097, %int0_7840, %int0_7841 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %6099 = torch.prim.ListConstruct %6081, %6094, %6095, %6096 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_7842 = torch.constant.bool false %6100 = 
torch.aten.index_put %6093, %6099, %6098, %false_7842 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_7843 = torch.constant.int 2662400 %6101 = torch.prim.ListConstruct %731, %int2662400_7843 : (!torch.int, !torch.int) -> !torch.list %6102 = torch.aten.view %6100, %6101 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_7844 = torch.constant.int -1 %int26_7845 = torch.constant.int 26 %int2_7846 = torch.constant.int 2 %int16_7847 = torch.constant.int 16 %int32_7848 = torch.constant.int 32 %int100_7849 = torch.constant.int 100 %6103 = torch.prim.ListConstruct %int-1_7844, %int26_7845, %int2_7846, %int16_7847, %int32_7848, %int100_7849 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6104 = torch.aten.view %6102, %6103 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_7850 = torch.constant.int 0 %int3_7851 = torch.constant.int 3 %6105 = torch.aten.select.int %6018, %int0_7850, %int3_7851 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_7852 = torch.constant.int 0 %int3_7853 = torch.constant.int 3 %6106 = torch.aten.select.int %arg3, %int0_7852, %int3_7853 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_7854 = torch.constant.int 0 %int0_7855 = torch.constant.int 0 %int9223372036854775807_7856 = torch.constant.int 9223372036854775807 %int1_7857 = torch.constant.int 1 %6107 = torch.aten.slice.Tensor %6106, %int0_7854, %int0_7855, %int9223372036854775807_7856, %int1_7857 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_7858 = torch.constant.int 16 %6108 = torch.aten.floor_divide.Scalar %6105, %int16_7858 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_7859 = torch.constant.int 0 %6109 
= torch.aten.index_select %6107, %int0_7859, %6108 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_7860 = torch.constant.int 16 %6110 = torch.aten.remainder.Scalar %6105, %int16_7860 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_7861 = torch.constant.none %6111 = torch.aten.clone %570, %none_7861 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_7862 = torch.constant.none %6112 = torch.aten.clone %571, %none_7862 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_7863 = torch.constant.int 0 %6113 = torch.aten.unsqueeze %6110, %int0_7863 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_7864 = torch.constant.int 0 %int3_7865 = torch.constant.int 3 %6114 = torch.aten.select.int %6017, %int0_7864, %int3_7865 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_7866 = torch.constant.int 0 %int0_7867 = torch.constant.int 0 %6115 = torch.aten.select.int %6114, %int0_7866, %int0_7867 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %6116 = torch.prim.ListConstruct %6109, %6111, %6112, %6113 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_7868 = torch.constant.bool false %6117 = torch.aten.index_put %6104, %6116, %6115, %false_7868 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_7869 = torch.constant.int 2662400 %6118 = torch.prim.ListConstruct %731, %int2662400_7869 : (!torch.int, !torch.int) -> !torch.list %6119 = torch.aten.view %6117, %6118 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_7870 = torch.constant.int -1 %int26_7871 = torch.constant.int 26 %int2_7872 = torch.constant.int 2 %int16_7873 = 
torch.constant.int 16 %int32_7874 = torch.constant.int 32 %int100_7875 = torch.constant.int 100 %6120 = torch.prim.ListConstruct %int-1_7870, %int26_7871, %int2_7872, %int16_7873, %int32_7874, %int100_7875 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6121 = torch.aten.view %6119, %6120 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_7876 = torch.constant.none %6122 = torch.aten.clone %572, %none_7876 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_7877 = torch.constant.none %6123 = torch.aten.clone %573, %none_7877 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_7878 = torch.constant.int 0 %6124 = torch.aten.unsqueeze %6110, %int0_7878 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_7879 = torch.constant.int 0 %int3_7880 = torch.constant.int 3 %6125 = torch.aten.select.int %6003, %int0_7879, %int3_7880 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_7881 = torch.constant.int 0 %int0_7882 = torch.constant.int 0 %6126 = torch.aten.select.int %6125, %int0_7881, %int0_7882 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %6127 = torch.prim.ListConstruct %6109, %6122, %6123, %6124 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_7883 = torch.constant.bool false %6128 = torch.aten.index_put %6121, %6127, %6126, %false_7883 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_7884 = torch.constant.int 2662400 %6129 = torch.prim.ListConstruct %731, %int2662400_7884 : (!torch.int, !torch.int) -> !torch.list %6130 = torch.aten.view %6128, %6129 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int52_7885 
= torch.constant.int 52 %6131 = torch.aten.mul.Scalar %arg3, %int52_7885 : !torch.vtensor<[4,?],si64>, !torch.int -> !torch.vtensor<[4,?],si64> %int40 = torch.constant.int 40 %int1_7886 = torch.constant.int 1 %6132 = torch.aten.add.Scalar %6131, %int40, %int1_7886 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_7887 = torch.constant.int 4 %6133 = torch.aten.mul.int %int4_7887, %655 : !torch.int, !torch.int -> !torch.int %6134 = torch.prim.ListConstruct %6133 : (!torch.int) -> !torch.list %6135 = torch.aten.view %6132, %6134 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int-1_7888 = torch.constant.int -1 %int26_7889 = torch.constant.int 26 %int2_7890 = torch.constant.int 2 %int16_7891 = torch.constant.int 16 %int32_7892 = torch.constant.int 32 %int100_7893 = torch.constant.int 100 %6136 = torch.prim.ListConstruct %int-1_7888, %int26_7889, %int2_7890, %int16_7891, %int32_7892, %int100_7893 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6137 = torch.aten.view %6130, %6136 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int26_7894 = torch.constant.int 26 %6138 = torch.aten.mul.int %731, %int26_7894 : !torch.int, !torch.int -> !torch.int %int2_7895 = torch.constant.int 2 %6139 = torch.aten.mul.int %6138, %int2_7895 : !torch.int, !torch.int -> !torch.int %int16_7896 = torch.constant.int 16 %int32_7897 = torch.constant.int 32 %int100_7898 = torch.constant.int 100 %6140 = torch.prim.ListConstruct %6139, %int16_7896, %int32_7897, %int100_7898 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6141 = torch.aten.view %6137, %6140 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,16,32,100],f32> %int0_7899 = torch.constant.int 0 %6142 = torch.aten.index_select %6141, %int0_7899, %6135 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> 
!torch.vtensor<[?,16,32,100],f32> %int4_7900 = torch.constant.int 4 %int16_7901 = torch.constant.int 16 %int32_7902 = torch.constant.int 32 %int100_7903 = torch.constant.int 100 %6143 = torch.prim.ListConstruct %int4_7900, %655, %int16_7901, %int32_7902, %int100_7903 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6144 = torch.aten.view %6142, %6143 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_7904 = torch.constant.int 1 %6145 = torch.aten.size.int %6144, %int1_7904 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_7905 = torch.constant.int 16 %6146 = torch.aten.mul.int %6145, %int16_7905 : !torch.int, !torch.int -> !torch.int %int4_7906 = torch.constant.int 4 %int32_7907 = torch.constant.int 32 %int100_7908 = torch.constant.int 100 %6147 = torch.prim.ListConstruct %int4_7906, %6146, %int32_7907, %int100_7908 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6148 = torch.aten.view %6144, %6147 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_7909 = torch.constant.int 0 %int0_7910 = torch.constant.int 0 %int9223372036854775807_7911 = torch.constant.int 9223372036854775807 %int1_7912 = torch.constant.int 1 %6149 = torch.aten.slice.Tensor %5890, %int0_7909, %int0_7910, %int9223372036854775807_7911, %int1_7912 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int16_7913 = torch.constant.int 16 %6150 = torch.aten.mul.int %655, %int16_7913 : !torch.int, !torch.int -> !torch.int %int1_7914 = torch.constant.int 1 %int0_7915 = torch.constant.int 0 %int1_7916 = torch.constant.int 1 %6151 = torch.aten.slice.Tensor %6149, %int1_7914, %int0_7915, %6150, %int1_7916 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_7917 = torch.constant.bool false %6152 = 
torch.aten.copy %6151, %6148, %false_7917 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_7918 = torch.constant.int 0 %int0_7919 = torch.constant.int 0 %int9223372036854775807_7920 = torch.constant.int 9223372036854775807 %int1_7921 = torch.constant.int 1 %6153 = torch.aten.slice.Tensor %5890, %int0_7918, %int0_7919, %int9223372036854775807_7920, %int1_7921 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_7922 = torch.constant.int 1 %int0_7923 = torch.constant.int 0 %int1_7924 = torch.constant.int 1 %6154 = torch.aten.slice_scatter %6153, %6152, %int1_7922, %int0_7923, %6150, %int1_7924 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_7925 = torch.constant.int 0 %int0_7926 = torch.constant.int 0 %int9223372036854775807_7927 = torch.constant.int 9223372036854775807 %int1_7928 = torch.constant.int 1 %6155 = torch.aten.slice_scatter %5890, %6154, %int0_7925, %int0_7926, %int9223372036854775807_7927, %int1_7928 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_7929 = torch.constant.int 1 %int1_7930 = torch.constant.int 1 %6156 = torch.aten.add.Scalar %6132, %int1_7929, %int1_7930 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_7931 = torch.constant.int 4 %6157 = torch.aten.mul.int %int4_7931, %655 : !torch.int, !torch.int -> !torch.int %6158 = torch.prim.ListConstruct %6157 : (!torch.int) -> !torch.list %6159 = torch.aten.view %6156, %6158 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int0_7932 = torch.constant.int 0 %6160 = torch.aten.index_select %6141, %int0_7932, %6159 : !torch.vtensor<[?,16,32,100],f32>, 
!torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_7933 = torch.constant.int 4 %int16_7934 = torch.constant.int 16 %int32_7935 = torch.constant.int 32 %int100_7936 = torch.constant.int 100 %6161 = torch.prim.ListConstruct %int4_7933, %655, %int16_7934, %int32_7935, %int100_7936 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6162 = torch.aten.view %6160, %6161 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_7937 = torch.constant.int 1 %6163 = torch.aten.size.int %6162, %int1_7937 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_7938 = torch.constant.int 16 %6164 = torch.aten.mul.int %6163, %int16_7938 : !torch.int, !torch.int -> !torch.int %int4_7939 = torch.constant.int 4 %int32_7940 = torch.constant.int 32 %int100_7941 = torch.constant.int 100 %6165 = torch.prim.ListConstruct %int4_7939, %6164, %int32_7940, %int100_7941 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6166 = torch.aten.view %6162, %6165 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_7942 = torch.constant.int 0 %int0_7943 = torch.constant.int 0 %int9223372036854775807_7944 = torch.constant.int 9223372036854775807 %int1_7945 = torch.constant.int 1 %6167 = torch.aten.slice.Tensor %5907, %int0_7942, %int0_7943, %int9223372036854775807_7944, %int1_7945 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_7946 = torch.constant.int 1 %int0_7947 = torch.constant.int 0 %int1_7948 = torch.constant.int 1 %6168 = torch.aten.slice.Tensor %6167, %int1_7946, %int0_7947, %6150, %int1_7948 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_7949 = torch.constant.bool false %6169 = torch.aten.copy %6168, %6166, %false_7949 : !torch.vtensor<[4,?,32,100],f32>, 
!torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_7950 = torch.constant.int 0 %int0_7951 = torch.constant.int 0 %int9223372036854775807_7952 = torch.constant.int 9223372036854775807 %int1_7953 = torch.constant.int 1 %6170 = torch.aten.slice.Tensor %5907, %int0_7950, %int0_7951, %int9223372036854775807_7952, %int1_7953 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_7954 = torch.constant.int 1 %int0_7955 = torch.constant.int 0 %int1_7956 = torch.constant.int 1 %6171 = torch.aten.slice_scatter %6170, %6169, %int1_7954, %int0_7955, %6150, %int1_7956 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_7957 = torch.constant.int 0 %int0_7958 = torch.constant.int 0 %int9223372036854775807_7959 = torch.constant.int 9223372036854775807 %int1_7960 = torch.constant.int 1 %6172 = torch.aten.slice_scatter %5907, %6171, %int0_7957, %int0_7958, %int9223372036854775807_7959, %int1_7960 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_7961 = torch.constant.int 0 %int0_7962 = torch.constant.int 0 %int9223372036854775807_7963 = torch.constant.int 9223372036854775807 %int1_7964 = torch.constant.int 1 %6173 = torch.aten.slice.Tensor %671, %int0_7961, %int0_7962, %int9223372036854775807_7963, %int1_7964 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_7965 = torch.constant.int 1 %int0_7966 = torch.constant.int 0 %int1_7967 = torch.constant.int 1 %6174 = torch.aten.slice.Tensor %6173, %int1_7965, %int0_7966, %6150, %int1_7967 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int0_7968 = 
torch.constant.int 0 %int0_7969 = torch.constant.int 0 %int9223372036854775807_7970 = torch.constant.int 9223372036854775807 %int1_7971 = torch.constant.int 1 %6175 = torch.aten.slice.Tensor %673, %int0_7968, %int0_7969, %int9223372036854775807_7970, %int1_7971 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_7972 = torch.constant.int 1 %int0_7973 = torch.constant.int 0 %int1_7974 = torch.constant.int 1 %6176 = torch.aten.slice.Tensor %6175, %int1_7972, %int0_7973, %6150, %int1_7974 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_7975 = torch.constant.int 1 %int2_7976 = torch.constant.int 2 %6177 = torch.aten.transpose.int %6013, %int1_7975, %int2_7976 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,1,100],f32> %int4_7977 = torch.constant.int 4 %int32_7978 = torch.constant.int 32 %int1_7979 = torch.constant.int 1 %int100_7980 = torch.constant.int 100 %6178 = torch.prim.ListConstruct %int4_7977, %int32_7978, %int1_7979, %int100_7980 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_7981 = torch.constant.bool false %6179 = torch.aten.expand %6177, %6178, %false_7981 : !torch.vtensor<[4,32,1,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,100],f32> %int128_7982 = torch.constant.int 128 %int1_7983 = torch.constant.int 1 %int100_7984 = torch.constant.int 100 %6180 = torch.prim.ListConstruct %int128_7982, %int1_7983, %int100_7984 : (!torch.int, !torch.int, !torch.int) -> !torch.list %6181 = torch.aten.view %6179, %6180 : !torch.vtensor<[4,32,1,100],f32>, !torch.list -> !torch.vtensor<[128,1,100],f32> %int0_7985 = torch.constant.int 0 %int0_7986 = torch.constant.int 0 %int9223372036854775807_7987 = torch.constant.int 9223372036854775807 %int1_7988 = torch.constant.int 1 %6182 = torch.aten.slice.Tensor %6155, %int0_7985, %int0_7986, 
%int9223372036854775807_7987, %int1_7988 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_7989 = torch.constant.int 1 %int0_7990 = torch.constant.int 0 %int1_7991 = torch.constant.int 1 %6183 = torch.aten.slice.Tensor %6182, %int1_7989, %int0_7990, %6150, %int1_7991 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_7992 = torch.constant.int 1 %int2_7993 = torch.constant.int 2 %6184 = torch.aten.transpose.int %6183, %int1_7992, %int2_7993 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int2_7994 = torch.constant.int 2 %int3_7995 = torch.constant.int 3 %6185 = torch.aten.transpose.int %6184, %int2_7994, %int3_7995 : !torch.vtensor<[4,32,?,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int1_7996 = torch.constant.int 1 %6186 = torch.aten.size.int %6174, %int1_7996 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_7997 = torch.constant.int 4 %int32_7998 = torch.constant.int 32 %int100_7999 = torch.constant.int 100 %6187 = torch.prim.ListConstruct %int4_7997, %int32_7998, %int100_7999, %6186 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_8000 = torch.constant.bool false %6188 = torch.aten.expand %6185, %6187, %false_8000 : !torch.vtensor<[4,32,100,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,100,?],f32> %int0_8001 = torch.constant.int 0 %6189 = torch.aten.clone %6188, %int0_8001 : !torch.vtensor<[4,32,100,?],f32>, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int128_8002 = torch.constant.int 128 %int100_8003 = torch.constant.int 100 %6190 = torch.prim.ListConstruct %int128_8002, %int100_8003, %6186 : (!torch.int, !torch.int, !torch.int) -> !torch.list %6191 = torch.aten._unsafe_view %6189, %6190 : !torch.vtensor<[4,32,100,?],f32>, !torch.list -> !torch.vtensor<[128,100,?],f32> %6192 = 
torch.aten.bmm %6181, %6191 : !torch.vtensor<[128,1,100],f32>, !torch.vtensor<[128,100,?],f32> -> !torch.vtensor<[128,1,?],f32> %int4_8004 = torch.constant.int 4 %int32_8005 = torch.constant.int 32 %int1_8006 = torch.constant.int 1 %6193 = torch.prim.ListConstruct %int4_8004, %int32_8005, %int1_8006, %6186 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6194 = torch.aten.view %6192, %6193 : !torch.vtensor<[128,1,?],f32>, !torch.list -> !torch.vtensor<[4,32,1,?],f32> %float1.000000e01_8007 = torch.constant.float 1.000000e+01 %6195 = torch.aten.div.Scalar %6194, %float1.000000e01_8007 : !torch.vtensor<[4,32,1,?],f32>, !torch.float -> !torch.vtensor<[4,32,1,?],f32> %int1_8008 = torch.constant.int 1 %6196 = torch.aten.add.Tensor %6195, %895, %int1_8008 : !torch.vtensor<[4,32,1,?],f32>, !torch.vtensor<[4,1,1,?],f32>, !torch.int -> !torch.vtensor<[4,32,1,?],f32> %int-1_8009 = torch.constant.int -1 %false_8010 = torch.constant.bool false %6197 = torch.aten._softmax %6196, %int-1_8009, %false_8010 : !torch.vtensor<[4,32,1,?],f32>, !torch.int, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int4_8011 = torch.constant.int 4 %int32_8012 = torch.constant.int 32 %int1_8013 = torch.constant.int 1 %6198 = torch.prim.ListConstruct %int4_8011, %int32_8012, %int1_8013, %6186 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_8014 = torch.constant.bool false %6199 = torch.aten.expand %6197, %6198, %false_8014 : !torch.vtensor<[4,32,1,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int128_8015 = torch.constant.int 128 %int1_8016 = torch.constant.int 1 %6200 = torch.prim.ListConstruct %int128_8015, %int1_8016, %6186 : (!torch.int, !torch.int, !torch.int) -> !torch.list %6201 = torch.aten.view %6199, %6200 : !torch.vtensor<[4,32,1,?],f32>, !torch.list -> !torch.vtensor<[128,1,?],f32> %int0_8017 = torch.constant.int 0 %int0_8018 = torch.constant.int 0 %int9223372036854775807_8019 = torch.constant.int 9223372036854775807 
// Second batched matmul of this attention step: the softmax output %6201
// ([128,1,?]) is multiplied by a [128,?,100] operand derived from %6172.
// NOTE(review): %6172 is presumably the gathered value cache - confirm upstream.

// Full-range slice of %6172 along dim 0 (start 0, end INT64_MAX, step 1).
%int1_8020 = torch.constant.int 1
%6202 = torch.aten.slice.Tensor %6172, %int0_8017, %int0_8018, %int9223372036854775807_8019, %int1_8020 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32>

// Keep only the first %6150 entries along dim 1 (%6150 = %655 * 16).
%int1_8021 = torch.constant.int 1
%int0_8022 = torch.constant.int 0
%int1_8023 = torch.constant.int 1
%6203 = torch.aten.slice.Tensor %6202, %int1_8021, %int0_8022, %6150, %int1_8023 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32>

// Swap dims 1 and 2: [4,?,32,100] -> [4,32,?,100].
%int1_8024 = torch.constant.int 1
%int2_8025 = torch.constant.int 2
%6204 = torch.aten.transpose.int %6203, %int1_8024, %int2_8025 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32>

// The dynamic extent is read from dim 1 of %6176 and used for the expand/view shapes.
%int1_8026 = torch.constant.int 1
%6205 = torch.aten.size.int %6176, %int1_8026 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int

// Expand to the explicit shape [4, 32, %6205, 100] and clone the result.
%int4_8027 = torch.constant.int 4
%int32_8028 = torch.constant.int 32
%int100_8029 = torch.constant.int 100
%6206 = torch.prim.ListConstruct %int4_8027, %int32_8028, %6205, %int100_8029 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%false_8030 = torch.constant.bool false
%6207 = torch.aten.expand %6204, %6206, %false_8030 : !torch.vtensor<[4,32,?,100],f32>, !torch.list<int>, !torch.bool -> !torch.vtensor<[4,32,?,100],f32>
%int0_8031 = torch.constant.int 0
%6208 = torch.aten.clone %6207, %int0_8031 : !torch.vtensor<[4,32,?,100],f32>, !torch.int -> !torch.vtensor<[4,32,?,100],f32>

// Fold the two leading dims (4 * 32 = 128) so the operand is 3-D for bmm.
%int128_8032 = torch.constant.int 128
%int100_8033 = torch.constant.int 100
%6209 = torch.prim.ListConstruct %int128_8032, %6205, %int100_8033 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%6210 = torch.aten._unsafe_view %6208, %6209 : !torch.vtensor<[4,32,?,100],f32>, !torch.list<int> -> !torch.vtensor<[128,?,100],f32>

// [128,1,?] x [128,?,100] -> [128,1,100].
%6211 = torch.aten.bmm %6201, %6210 : !torch.vtensor<[128,1,?],f32>, !torch.vtensor<[128,?,100],f32> -> !torch.vtensor<[128,1,100],f32>
// Consumes the bmm result %6211 ([128,1,100]): reshapes it to [4,1,3200],
// applies a 3200x3200 projection, adds it to %5978, normalises, runs a gated
// feed-forward (silu(x*W188) * (x*W189), then W190), adds the residual, and
// starts the next normalisation (ending at %6249).
// NOTE(review): the dynamic operand/result types of the util.call ops are
// written as tensor<?x?xKxf32>; verify against the callee declarations.
// NOTE(review): %186..%190 are presumably attn_output / ffn_norm / ffn_gate /
// ffn_up / ffn_down weights of one block - confirm where they are loaded.

// [128,1,100] -> [4,32,1,100] -> (transpose 1,2) [4,1,32,100] -> [4,1,3200].
%int4_8034 = torch.constant.int 4
%int32_8035 = torch.constant.int 32
%int1_8036 = torch.constant.int 1
%int100_8037 = torch.constant.int 100
%6212 = torch.prim.ListConstruct %int4_8034, %int32_8035, %int1_8036, %int100_8037 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list<int>
%6213 = torch.aten.view %6211, %6212 : !torch.vtensor<[128,1,100],f32>, !torch.list<int> -> !torch.vtensor<[4,32,1,100],f32>
%int1_8038 = torch.constant.int 1
%int2_8039 = torch.constant.int 2
%6214 = torch.aten.transpose.int %6213, %int1_8038, %int2_8039 : !torch.vtensor<[4,32,1,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,1,32,100],f32>
%int4_8040 = torch.constant.int 4
%int1_8041 = torch.constant.int 1
%int-1_8042 = torch.constant.int -1
%6215 = torch.prim.ListConstruct %int4_8040, %int1_8041, %int-1_8042 : (!torch.int, !torch.int, !torch.int) -> !torch.list<int>
%6216 = torch.aten.view %6214, %6215 : !torch.vtensor<[4,1,32,100],f32>, !torch.list<int> -> !torch.vtensor<[4,1,3200],f32>

// Projection with %186 through the f32 x f16 -> f32 matmul kernel; the static
// shape is cast to a dynamic one for the call and cast back afterwards.
%6217 = torch_c.to_builtin_tensor %6216 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32>
%cast_8043 = tensor.cast %6217 : tensor<4x1x3200xf32> to tensor<?x?x3200xf32>
%6218 = torch_c.to_builtin_tensor %186 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16>
%6219 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_8043, %6218) : (tensor<?x?x3200xf32>, tensor<3200x3200xf16>) -> tensor<?x?x3200xf32>
%cast_8044 = tensor.cast %6219 : tensor<?x?x3200xf32> to tensor<4x1x3200xf32>
%6220 = torch_c.from_builtin_tensor %cast_8044 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32>

// Residual add: %5978 + 1 * %6220.
%int1_8045 = torch.constant.int 1
%6221 = torch.aten.add.Tensor %5978, %6220, %int1_8045 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32>

// RMS normalisation: x * rsqrt(mean(x^2, dim=-1, keepdim=true) + eps) * %187.
%int2_8046 = torch.constant.int 2
%6222 = torch.aten.pow.Tensor_Scalar %6221, %int2_8046 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32>
%int-1_8047 = torch.constant.int -1
%6223 = torch.prim.ListConstruct %int-1_8047 : (!torch.int) -> !torch.list<int>
%true_8048 = torch.constant.bool true
%none_8049 = torch.constant.none
%6224 = torch.aten.mean.dim %6222, %6223, %true_8048, %none_8049 : !torch.vtensor<[4,1,3200],f32>, !torch.list<int>, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32>
%float9.999990e-07_8050 = torch.constant.float 9.9999999747524271E-7
%int1_8051 = torch.constant.int 1
%6225 = torch.aten.add.Scalar %6224, %float9.999990e-07_8050, %int1_8051 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32>
%6226 = torch.aten.rsqrt %6225 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32>
%6227 = torch.aten.mul.Tensor %6221, %6226 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32>
%6228 = torch.aten.mul.Tensor %6227, %187 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32>

// First feed-forward branch: matmul with %188 ([8640,3200]) followed by SiLU.
%6229 = torch_c.to_builtin_tensor %6228 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32>
%cast_8052 = tensor.cast %6229 : tensor<4x1x3200xf32> to tensor<?x?x3200xf32>
%6230 = torch_c.to_builtin_tensor %188 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16>
%6231 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_8052, %6230) : (tensor<?x?x3200xf32>, tensor<8640x3200xf16>) -> tensor<?x?x8640xf32>
%cast_8053 = tensor.cast %6231 : tensor<?x?x8640xf32> to tensor<4x1x8640xf32>
%6232 = torch_c.from_builtin_tensor %cast_8053 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32>
%6233 = torch.aten.silu %6232 : !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32>

// Second feed-forward branch: the same normalised input multiplied by %189.
%6234 = torch_c.to_builtin_tensor %6228 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32>
%cast_8054 = tensor.cast %6234 : tensor<4x1x3200xf32> to tensor<?x?x3200xf32>
%6235 = torch_c.to_builtin_tensor %189 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16>
%6236 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_8054, %6235) : (tensor<?x?x3200xf32>, tensor<8640x3200xf16>) -> tensor<?x?x8640xf32>
%cast_8055 = tensor.cast %6236 : tensor<?x?x8640xf32> to tensor<4x1x8640xf32>
%6237 = torch_c.from_builtin_tensor %cast_8055 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32>

// Elementwise product of the two branches, then projection back to 3200 with %190.
%6238 = torch.aten.mul.Tensor %6233, %6237 : !torch.vtensor<[4,1,8640],f32>, !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32>
%6239 = torch_c.to_builtin_tensor %6238 : !torch.vtensor<[4,1,8640],f32> -> tensor<4x1x8640xf32>
%cast_8056 = tensor.cast %6239 : tensor<4x1x8640xf32> to tensor<?x?x8640xf32>
%6240 = torch_c.to_builtin_tensor %190 : !torch.vtensor<[3200,8640],f16> -> tensor<3200x8640xf16>
%6241 = util.call @sharktank_mmtfp_3d_3200_8640_f32f16f32(%cast_8056, %6240) : (tensor<?x?x8640xf32>, tensor<3200x8640xf16>) -> tensor<?x?x3200xf32>
%cast_8057 = tensor.cast %6241 : tensor<?x?x3200xf32> to tensor<4x1x3200xf32>
%6242 = torch_c.from_builtin_tensor %cast_8057 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32>

// Residual add: %6221 + 1 * %6242.
%int1_8058 = torch.constant.int 1
%6243 = torch.aten.add.Tensor %6221, %6242, %int1_8058 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32>

// Start of the next normalisation: x * rsqrt(mean(x^2, dim=-1, keepdim=true) + eps).
%int2_8059 = torch.constant.int 2
%6244 = torch.aten.pow.Tensor_Scalar %6243, %int2_8059 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32>
%int-1_8060 = torch.constant.int -1
%6245 = torch.prim.ListConstruct %int-1_8060 : (!torch.int) -> !torch.list<int>
%true_8061 = torch.constant.bool true
%none_8062 = torch.constant.none
%6246 = torch.aten.mean.dim %6244, %6245, %true_8061, %none_8062 : !torch.vtensor<[4,1,3200],f32>, !torch.list<int>, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32>
%float9.999990e-07_8063 = torch.constant.float 9.9999999747524271E-7
%int1_8064 = torch.constant.int 1
%6247 = torch.aten.add.Scalar %6246, %float9.999990e-07_8063, %int1_8064 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32>
%6248 = torch.aten.rsqrt %6247 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32>
%6249 = torch.aten.mul.Tensor %6243, %6248 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32>
%6250 = torch.aten.mul.Tensor %6249, %191 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %6251 = torch_c.to_builtin_tensor %6250 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_8065 = tensor.cast %6251 : tensor<4x1x3200xf32> to tensor %6252 = torch_c.to_builtin_tensor %192 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %6253 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_8065, %6252) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_8066 = tensor.cast %6253 : tensor to tensor<4x1x3200xf32> %6254 = torch_c.from_builtin_tensor %cast_8066 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %6255 = torch_c.to_builtin_tensor %6250 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_8067 = tensor.cast %6255 : tensor<4x1x3200xf32> to tensor %6256 = torch_c.to_builtin_tensor %193 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %6257 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_8067, %6256) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_8068 = tensor.cast %6257 : tensor to tensor<4x1x3200xf32> %6258 = torch_c.from_builtin_tensor %cast_8068 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %6259 = torch_c.to_builtin_tensor %6250 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_8069 = tensor.cast %6259 : tensor<4x1x3200xf32> to tensor %6260 = torch_c.to_builtin_tensor %194 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %6261 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_8069, %6260) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_8070 = tensor.cast %6261 : tensor to tensor<4x1x3200xf32> %6262 = torch_c.from_builtin_tensor %cast_8070 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int4_8071 = torch.constant.int 4 %int1_8072 = torch.constant.int 1 %int32_8073 = torch.constant.int 32 %int100_8074 = torch.constant.int 100 %6263 = torch.prim.ListConstruct %int4_8071, %int1_8072, %int32_8073, 
%int100_8074 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6264 = torch.aten.view %6254, %6263 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_8075 = torch.constant.int 4 %int1_8076 = torch.constant.int 1 %int32_8077 = torch.constant.int 32 %int100_8078 = torch.constant.int 100 %6265 = torch.prim.ListConstruct %int4_8075, %int1_8076, %int32_8077, %int100_8078 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6266 = torch.aten.view %6258, %6265 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_8079 = torch.constant.int 4 %int1_8080 = torch.constant.int 1 %int32_8081 = torch.constant.int 32 %int100_8082 = torch.constant.int 100 %6267 = torch.prim.ListConstruct %int4_8079, %int1_8080, %int32_8081, %int100_8082 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6268 = torch.aten.view %6262, %6267 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_8083 = torch.constant.int 4 %int1_8084 = torch.constant.int 1 %int32_8085 = torch.constant.int 32 %int-1_8086 = torch.constant.int -1 %int2_8087 = torch.constant.int 2 %6269 = torch.prim.ListConstruct %int4_8083, %int1_8084, %int32_8085, %int-1_8086, %int2_8087 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6270 = torch.aten.view %6264, %6269 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %6271 = torch.aten.view_as_complex %6270 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %int4_8088 = torch.constant.int 4 %int1_8089 = torch.constant.int 1 %int32_8090 = torch.constant.int 32 %int-1_8091 = torch.constant.int -1 %int2_8092 = torch.constant.int 2 %6272 = torch.prim.ListConstruct %int4_8088, %int1_8089, %int32_8090, %int-1_8091, %int2_8092 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6273 = torch.aten.view %6266, %6272 : 
!torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %6274 = torch.aten.view_as_complex %6273 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %6275 = torch.aten.mul.Tensor %6271, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %6276 = torch.aten.view_as_real %6275 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_8093 = torch.constant.int 4 %int1_8094 = torch.constant.int 1 %int32_8095 = torch.constant.int 32 %int100_8096 = torch.constant.int 100 %6277 = torch.prim.ListConstruct %int4_8093, %int1_8094, %int32_8095, %int100_8096 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6278 = torch.aten.view %6276, %6277 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %6279 = torch.aten.mul.Tensor %6274, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %6280 = torch.aten.view_as_real %6279 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_8097 = torch.constant.int 4 %int1_8098 = torch.constant.int 1 %int32_8099 = torch.constant.int 32 %int100_8100 = torch.constant.int 100 %6281 = torch.prim.ListConstruct %int4_8097, %int1_8098, %int32_8099, %int100_8100 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6282 = torch.aten.view %6280, %6281 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int1_8101 = torch.constant.int 1 %int1_8102 = torch.constant.int 1 %6283 = torch.aten.add.Scalar %arg2, %int1_8101, %int1_8102 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[4],si64> %int0_8103 = torch.constant.int 0 %int0_8104 = torch.constant.int 0 %6284 = torch.aten.select.int %6283, %int0_8103, %int0_8104 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_8105 = 
torch.constant.int 0 %int0_8106 = torch.constant.int 0 %6285 = torch.aten.select.int %arg3, %int0_8105, %int0_8106 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_8107 = torch.constant.int 0 %int0_8108 = torch.constant.int 0 %int9223372036854775807_8109 = torch.constant.int 9223372036854775807 %int1_8110 = torch.constant.int 1 %6286 = torch.aten.slice.Tensor %6285, %int0_8107, %int0_8108, %int9223372036854775807_8109, %int1_8110 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_8111 = torch.constant.int 16 %6287 = torch.aten.floor_divide.Scalar %6284, %int16_8111 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_8112 = torch.constant.int 0 %6288 = torch.aten.index_select %6286, %int0_8112, %6287 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_8113 = torch.constant.int 16 %6289 = torch.aten.remainder.Scalar %6284, %int16_8113 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_8114 = torch.constant.none %6290 = torch.aten.clone %574, %none_8114 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_8115 = torch.constant.none %6291 = torch.aten.clone %575, %none_8115 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_8116 = torch.constant.int 0 %6292 = torch.aten.unsqueeze %6289, %int0_8116 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_8117 = torch.constant.int 0 %int0_8118 = torch.constant.int 0 %6293 = torch.aten.select.int %6282, %int0_8117, %int0_8118 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_8119 = torch.constant.int 0 %int0_8120 = torch.constant.int 0 %6294 = torch.aten.select.int %6293, %int0_8119, %int0_8120 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %int-1_8121 = torch.constant.int -1 %int26_8122 = 
torch.constant.int 26 %int2_8123 = torch.constant.int 2 %int16_8124 = torch.constant.int 16 %int32_8125 = torch.constant.int 32 %int100_8126 = torch.constant.int 100 %6295 = torch.prim.ListConstruct %int-1_8121, %int26_8122, %int2_8123, %int16_8124, %int32_8125, %int100_8126 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6296 = torch.aten.view %6130, %6295 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %6297 = torch.prim.ListConstruct %6288, %6290, %6291, %6292 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_8127 = torch.constant.bool false %6298 = torch.aten.index_put %6296, %6297, %6294, %false_8127 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_8128 = torch.constant.int 2662400 %6299 = torch.prim.ListConstruct %731, %int2662400_8128 : (!torch.int, !torch.int) -> !torch.list %6300 = torch.aten.view %6298, %6299 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_8129 = torch.constant.int -1 %int26_8130 = torch.constant.int 26 %int2_8131 = torch.constant.int 2 %int16_8132 = torch.constant.int 16 %int32_8133 = torch.constant.int 32 %int100_8134 = torch.constant.int 100 %6301 = torch.prim.ListConstruct %int-1_8129, %int26_8130, %int2_8131, %int16_8132, %int32_8133, %int100_8134 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6302 = torch.aten.view %6300, %6301 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_8135 = torch.constant.none %6303 = torch.aten.clone %576, %none_8135 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_8136 = torch.constant.none %6304 = torch.aten.clone %577, %none_8136 : !torch.vtensor<[1],si64>, !torch.none -> 
!torch.vtensor<[1],si64> %int0_8137 = torch.constant.int 0 %6305 = torch.aten.unsqueeze %6289, %int0_8137 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_8138 = torch.constant.int 0 %int0_8139 = torch.constant.int 0 %6306 = torch.aten.select.int %6268, %int0_8138, %int0_8139 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_8140 = torch.constant.int 0 %int0_8141 = torch.constant.int 0 %6307 = torch.aten.select.int %6306, %int0_8140, %int0_8141 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %6308 = torch.prim.ListConstruct %6288, %6303, %6304, %6305 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_8142 = torch.constant.bool false %6309 = torch.aten.index_put %6302, %6308, %6307, %false_8142 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_8143 = torch.constant.int 2662400 %6310 = torch.prim.ListConstruct %731, %int2662400_8143 : (!torch.int, !torch.int) -> !torch.list %6311 = torch.aten.view %6309, %6310 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_8144 = torch.constant.int -1 %int26_8145 = torch.constant.int 26 %int2_8146 = torch.constant.int 2 %int16_8147 = torch.constant.int 16 %int32_8148 = torch.constant.int 32 %int100_8149 = torch.constant.int 100 %6312 = torch.prim.ListConstruct %int-1_8144, %int26_8145, %int2_8146, %int16_8147, %int32_8148, %int100_8149 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6313 = torch.aten.view %6311, %6312 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_8150 = torch.constant.int 0 %int1_8151 = torch.constant.int 1 %6314 = torch.aten.select.int %6283, %int0_8150, %int1_8151 : 
!torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_8152 = torch.constant.int 0 %int1_8153 = torch.constant.int 1 %6315 = torch.aten.select.int %arg3, %int0_8152, %int1_8153 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_8154 = torch.constant.int 0 %int0_8155 = torch.constant.int 0 %int9223372036854775807_8156 = torch.constant.int 9223372036854775807 %int1_8157 = torch.constant.int 1 %6316 = torch.aten.slice.Tensor %6315, %int0_8154, %int0_8155, %int9223372036854775807_8156, %int1_8157 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_8158 = torch.constant.int 16 %6317 = torch.aten.floor_divide.Scalar %6314, %int16_8158 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_8159 = torch.constant.int 0 %6318 = torch.aten.index_select %6316, %int0_8159, %6317 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_8160 = torch.constant.int 16 %6319 = torch.aten.remainder.Scalar %6314, %int16_8160 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_8161 = torch.constant.none %6320 = torch.aten.clone %578, %none_8161 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_8162 = torch.constant.none %6321 = torch.aten.clone %579, %none_8162 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_8163 = torch.constant.int 0 %6322 = torch.aten.unsqueeze %6319, %int0_8163 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_8164 = torch.constant.int 0 %int1_8165 = torch.constant.int 1 %6323 = torch.aten.select.int %6282, %int0_8164, %int1_8165 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_8166 = torch.constant.int 0 %int0_8167 = torch.constant.int 0 %6324 = torch.aten.select.int %6323, %int0_8166, %int0_8167 : !torch.vtensor<[1,32,100],f32>, !torch.int, 
!torch.int -> !torch.vtensor<[32,100],f32> %6325 = torch.prim.ListConstruct %6318, %6320, %6321, %6322 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_8168 = torch.constant.bool false %6326 = torch.aten.index_put %6313, %6325, %6324, %false_8168 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_8169 = torch.constant.int 2662400 %6327 = torch.prim.ListConstruct %731, %int2662400_8169 : (!torch.int, !torch.int) -> !torch.list %6328 = torch.aten.view %6326, %6327 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_8170 = torch.constant.int -1 %int26_8171 = torch.constant.int 26 %int2_8172 = torch.constant.int 2 %int16_8173 = torch.constant.int 16 %int32_8174 = torch.constant.int 32 %int100_8175 = torch.constant.int 100 %6329 = torch.prim.ListConstruct %int-1_8170, %int26_8171, %int2_8172, %int16_8173, %int32_8174, %int100_8175 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6330 = torch.aten.view %6328, %6329 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_8176 = torch.constant.none %6331 = torch.aten.clone %580, %none_8176 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_8177 = torch.constant.none %6332 = torch.aten.clone %581, %none_8177 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_8178 = torch.constant.int 0 %6333 = torch.aten.unsqueeze %6319, %int0_8178 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_8179 = torch.constant.int 0 %int1_8180 = torch.constant.int 1 %6334 = torch.aten.select.int %6268, %int0_8179, %int1_8180 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_8181 = torch.constant.int 0 %int0_8182 = torch.constant.int 
0 %6335 = torch.aten.select.int %6334, %int0_8181, %int0_8182 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %6336 = torch.prim.ListConstruct %6318, %6331, %6332, %6333 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_8183 = torch.constant.bool false %6337 = torch.aten.index_put %6330, %6336, %6335, %false_8183 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_8184 = torch.constant.int 2662400 %6338 = torch.prim.ListConstruct %731, %int2662400_8184 : (!torch.int, !torch.int) -> !torch.list %6339 = torch.aten.view %6337, %6338 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_8185 = torch.constant.int -1 %int26_8186 = torch.constant.int 26 %int2_8187 = torch.constant.int 2 %int16_8188 = torch.constant.int 16 %int32_8189 = torch.constant.int 32 %int100_8190 = torch.constant.int 100 %6340 = torch.prim.ListConstruct %int-1_8185, %int26_8186, %int2_8187, %int16_8188, %int32_8189, %int100_8190 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6341 = torch.aten.view %6339, %6340 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_8191 = torch.constant.int 0 %int2_8192 = torch.constant.int 2 %6342 = torch.aten.select.int %6283, %int0_8191, %int2_8192 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_8193 = torch.constant.int 0 %int2_8194 = torch.constant.int 2 %6343 = torch.aten.select.int %arg3, %int0_8193, %int2_8194 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_8195 = torch.constant.int 0 %int0_8196 = torch.constant.int 0 %int9223372036854775807_8197 = torch.constant.int 9223372036854775807 %int1_8198 = torch.constant.int 1 %6344 = 
torch.aten.slice.Tensor %6343, %int0_8195, %int0_8196, %int9223372036854775807_8197, %int1_8198 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_8199 = torch.constant.int 16 %6345 = torch.aten.floor_divide.Scalar %6342, %int16_8199 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_8200 = torch.constant.int 0 %6346 = torch.aten.index_select %6344, %int0_8200, %6345 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_8201 = torch.constant.int 16 %6347 = torch.aten.remainder.Scalar %6342, %int16_8201 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_8202 = torch.constant.none %6348 = torch.aten.clone %582, %none_8202 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_8203 = torch.constant.none %6349 = torch.aten.clone %583, %none_8203 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_8204 = torch.constant.int 0 %6350 = torch.aten.unsqueeze %6347, %int0_8204 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_8205 = torch.constant.int 0 %int2_8206 = torch.constant.int 2 %6351 = torch.aten.select.int %6282, %int0_8205, %int2_8206 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_8207 = torch.constant.int 0 %int0_8208 = torch.constant.int 0 %6352 = torch.aten.select.int %6351, %int0_8207, %int0_8208 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %6353 = torch.prim.ListConstruct %6346, %6348, %6349, %6350 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_8209 = torch.constant.bool false %6354 = torch.aten.index_put %6341, %6353, %6352, %false_8209 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> 
%int2662400_8210 = torch.constant.int 2662400 %6355 = torch.prim.ListConstruct %731, %int2662400_8210 : (!torch.int, !torch.int) -> !torch.list %6356 = torch.aten.view %6354, %6355 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_8211 = torch.constant.int -1 %int26_8212 = torch.constant.int 26 %int2_8213 = torch.constant.int 2 %int16_8214 = torch.constant.int 16 %int32_8215 = torch.constant.int 32 %int100_8216 = torch.constant.int 100 %6357 = torch.prim.ListConstruct %int-1_8211, %int26_8212, %int2_8213, %int16_8214, %int32_8215, %int100_8216 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6358 = torch.aten.view %6356, %6357 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_8217 = torch.constant.none %6359 = torch.aten.clone %584, %none_8217 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_8218 = torch.constant.none %6360 = torch.aten.clone %585, %none_8218 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_8219 = torch.constant.int 0 %6361 = torch.aten.unsqueeze %6347, %int0_8219 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_8220 = torch.constant.int 0 %int2_8221 = torch.constant.int 2 %6362 = torch.aten.select.int %6268, %int0_8220, %int2_8221 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_8222 = torch.constant.int 0 %int0_8223 = torch.constant.int 0 %6363 = torch.aten.select.int %6362, %int0_8222, %int0_8223 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %6364 = torch.prim.ListConstruct %6346, %6359, %6360, %6361 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_8224 = torch.constant.bool false %6365 = torch.aten.index_put %6358, %6364, %6363, %false_8224 : 
!torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_8225 = torch.constant.int 2662400 %6366 = torch.prim.ListConstruct %731, %int2662400_8225 : (!torch.int, !torch.int) -> !torch.list %6367 = torch.aten.view %6365, %6366 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_8226 = torch.constant.int -1 %int26_8227 = torch.constant.int 26 %int2_8228 = torch.constant.int 2 %int16_8229 = torch.constant.int 16 %int32_8230 = torch.constant.int 32 %int100_8231 = torch.constant.int 100 %6368 = torch.prim.ListConstruct %int-1_8226, %int26_8227, %int2_8228, %int16_8229, %int32_8230, %int100_8231 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6369 = torch.aten.view %6367, %6368 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_8232 = torch.constant.int 0 %int3_8233 = torch.constant.int 3 %6370 = torch.aten.select.int %6283, %int0_8232, %int3_8233 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_8234 = torch.constant.int 0 %int3_8235 = torch.constant.int 3 %6371 = torch.aten.select.int %arg3, %int0_8234, %int3_8235 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_8236 = torch.constant.int 0 %int0_8237 = torch.constant.int 0 %int9223372036854775807_8238 = torch.constant.int 9223372036854775807 %int1_8239 = torch.constant.int 1 %6372 = torch.aten.slice.Tensor %6371, %int0_8236, %int0_8237, %int9223372036854775807_8238, %int1_8239 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_8240 = torch.constant.int 16 %6373 = torch.aten.floor_divide.Scalar %6370, %int16_8240 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_8241 = torch.constant.int 0 %6374 = torch.aten.index_select %6372, %int0_8241, %6373 : 
!torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_8242 = torch.constant.int 16 %6375 = torch.aten.remainder.Scalar %6370, %int16_8242 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_8243 = torch.constant.none %6376 = torch.aten.clone %586, %none_8243 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_8244 = torch.constant.none %6377 = torch.aten.clone %587, %none_8244 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_8245 = torch.constant.int 0 %6378 = torch.aten.unsqueeze %6375, %int0_8245 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_8246 = torch.constant.int 0 %int3_8247 = torch.constant.int 3 %6379 = torch.aten.select.int %6282, %int0_8246, %int3_8247 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_8248 = torch.constant.int 0 %int0_8249 = torch.constant.int 0 %6380 = torch.aten.select.int %6379, %int0_8248, %int0_8249 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %6381 = torch.prim.ListConstruct %6374, %6376, %6377, %6378 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_8250 = torch.constant.bool false %6382 = torch.aten.index_put %6369, %6381, %6380, %false_8250 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_8251 = torch.constant.int 2662400 %6383 = torch.prim.ListConstruct %731, %int2662400_8251 : (!torch.int, !torch.int) -> !torch.list %6384 = torch.aten.view %6382, %6383 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_8252 = torch.constant.int -1 %int26_8253 = torch.constant.int 26 %int2_8254 = torch.constant.int 2 %int16_8255 = torch.constant.int 16 %int32_8256 = torch.constant.int 32 
%int100_8257 = torch.constant.int 100 %6385 = torch.prim.ListConstruct %int-1_8252, %int26_8253, %int2_8254, %int16_8255, %int32_8256, %int100_8257 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6386 = torch.aten.view %6384, %6385 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_8258 = torch.constant.none %6387 = torch.aten.clone %588, %none_8258 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_8259 = torch.constant.none %6388 = torch.aten.clone %589, %none_8259 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_8260 = torch.constant.int 0 %6389 = torch.aten.unsqueeze %6375, %int0_8260 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_8261 = torch.constant.int 0 %int3_8262 = torch.constant.int 3 %6390 = torch.aten.select.int %6268, %int0_8261, %int3_8262 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_8263 = torch.constant.int 0 %int0_8264 = torch.constant.int 0 %6391 = torch.aten.select.int %6390, %int0_8263, %int0_8264 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %6392 = torch.prim.ListConstruct %6374, %6387, %6388, %6389 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_8265 = torch.constant.bool false %6393 = torch.aten.index_put %6386, %6392, %6391, %false_8265 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_8266 = torch.constant.int 2662400 %6394 = torch.prim.ListConstruct %731, %int2662400_8266 : (!torch.int, !torch.int) -> !torch.list %6395 = torch.aten.view %6393, %6394 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int52_8267 = torch.constant.int 52 %6396 = torch.aten.mul.Scalar 
%arg3, %int52_8267 : !torch.vtensor<[4,?],si64>, !torch.int -> !torch.vtensor<[4,?],si64> %int42 = torch.constant.int 42 %int1_8268 = torch.constant.int 1 %6397 = torch.aten.add.Scalar %6396, %int42, %int1_8268 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_8269 = torch.constant.int 4 %6398 = torch.aten.mul.int %int4_8269, %655 : !torch.int, !torch.int -> !torch.int %6399 = torch.prim.ListConstruct %6398 : (!torch.int) -> !torch.list %6400 = torch.aten.view %6397, %6399 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int-1_8270 = torch.constant.int -1 %int26_8271 = torch.constant.int 26 %int2_8272 = torch.constant.int 2 %int16_8273 = torch.constant.int 16 %int32_8274 = torch.constant.int 32 %int100_8275 = torch.constant.int 100 %6401 = torch.prim.ListConstruct %int-1_8270, %int26_8271, %int2_8272, %int16_8273, %int32_8274, %int100_8275 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6402 = torch.aten.view %6395, %6401 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int26_8276 = torch.constant.int 26 %6403 = torch.aten.mul.int %731, %int26_8276 : !torch.int, !torch.int -> !torch.int %int2_8277 = torch.constant.int 2 %6404 = torch.aten.mul.int %6403, %int2_8277 : !torch.int, !torch.int -> !torch.int %int16_8278 = torch.constant.int 16 %int32_8279 = torch.constant.int 32 %int100_8280 = torch.constant.int 100 %6405 = torch.prim.ListConstruct %6404, %int16_8278, %int32_8279, %int100_8280 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6406 = torch.aten.view %6402, %6405 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,16,32,100],f32> %int0_8281 = torch.constant.int 0 %6407 = torch.aten.index_select %6406, %int0_8281, %6400 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_8282 = torch.constant.int 4 %int16_8283 = 
torch.constant.int 16 %int32_8284 = torch.constant.int 32 %int100_8285 = torch.constant.int 100 %6408 = torch.prim.ListConstruct %int4_8282, %655, %int16_8283, %int32_8284, %int100_8285 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6409 = torch.aten.view %6407, %6408 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_8286 = torch.constant.int 1 %6410 = torch.aten.size.int %6409, %int1_8286 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_8287 = torch.constant.int 16 %6411 = torch.aten.mul.int %6410, %int16_8287 : !torch.int, !torch.int -> !torch.int %int4_8288 = torch.constant.int 4 %int32_8289 = torch.constant.int 32 %int100_8290 = torch.constant.int 100 %6412 = torch.prim.ListConstruct %int4_8288, %6411, %int32_8289, %int100_8290 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6413 = torch.aten.view %6409, %6412 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_8291 = torch.constant.int 0 %int0_8292 = torch.constant.int 0 %int9223372036854775807_8293 = torch.constant.int 9223372036854775807 %int1_8294 = torch.constant.int 1 %6414 = torch.aten.slice.Tensor %6155, %int0_8291, %int0_8292, %int9223372036854775807_8293, %int1_8294 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int16_8295 = torch.constant.int 16 %6415 = torch.aten.mul.int %655, %int16_8295 : !torch.int, !torch.int -> !torch.int %int1_8296 = torch.constant.int 1 %int0_8297 = torch.constant.int 0 %int1_8298 = torch.constant.int 1 %6416 = torch.aten.slice.Tensor %6414, %int1_8296, %int0_8297, %6415, %int1_8298 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_8299 = torch.constant.bool false %6417 = torch.aten.copy %6416, %6413, %false_8299 : !torch.vtensor<[4,?,32,100],f32>, 
!torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_8300 = torch.constant.int 0 %int0_8301 = torch.constant.int 0 %int9223372036854775807_8302 = torch.constant.int 9223372036854775807 %int1_8303 = torch.constant.int 1 %6418 = torch.aten.slice.Tensor %6155, %int0_8300, %int0_8301, %int9223372036854775807_8302, %int1_8303 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_8304 = torch.constant.int 1 %int0_8305 = torch.constant.int 0 %int1_8306 = torch.constant.int 1 %6419 = torch.aten.slice_scatter %6418, %6417, %int1_8304, %int0_8305, %6415, %int1_8306 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_8307 = torch.constant.int 0 %int0_8308 = torch.constant.int 0 %int9223372036854775807_8309 = torch.constant.int 9223372036854775807 %int1_8310 = torch.constant.int 1 %6420 = torch.aten.slice_scatter %6155, %6419, %int0_8307, %int0_8308, %int9223372036854775807_8309, %int1_8310 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_8311 = torch.constant.int 1 %int1_8312 = torch.constant.int 1 %6421 = torch.aten.add.Scalar %6397, %int1_8311, %int1_8312 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_8313 = torch.constant.int 4 %6422 = torch.aten.mul.int %int4_8313, %655 : !torch.int, !torch.int -> !torch.int %6423 = torch.prim.ListConstruct %6422 : (!torch.int) -> !torch.list %6424 = torch.aten.view %6421, %6423 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int0_8314 = torch.constant.int 0 %6425 = torch.aten.index_select %6406, %int0_8314, %6424 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_8315 = 
torch.constant.int 4 %int16_8316 = torch.constant.int 16 %int32_8317 = torch.constant.int 32 %int100_8318 = torch.constant.int 100 %6426 = torch.prim.ListConstruct %int4_8315, %655, %int16_8316, %int32_8317, %int100_8318 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6427 = torch.aten.view %6425, %6426 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_8319 = torch.constant.int 1 %6428 = torch.aten.size.int %6427, %int1_8319 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_8320 = torch.constant.int 16 %6429 = torch.aten.mul.int %6428, %int16_8320 : !torch.int, !torch.int -> !torch.int %int4_8321 = torch.constant.int 4 %int32_8322 = torch.constant.int 32 %int100_8323 = torch.constant.int 100 %6430 = torch.prim.ListConstruct %int4_8321, %6429, %int32_8322, %int100_8323 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6431 = torch.aten.view %6427, %6430 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_8324 = torch.constant.int 0 %int0_8325 = torch.constant.int 0 %int9223372036854775807_8326 = torch.constant.int 9223372036854775807 %int1_8327 = torch.constant.int 1 %6432 = torch.aten.slice.Tensor %6172, %int0_8324, %int0_8325, %int9223372036854775807_8326, %int1_8327 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_8328 = torch.constant.int 1 %int0_8329 = torch.constant.int 0 %int1_8330 = torch.constant.int 1 %6433 = torch.aten.slice.Tensor %6432, %int1_8328, %int0_8329, %6415, %int1_8330 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_8331 = torch.constant.bool false %6434 = torch.aten.copy %6433, %6431, %false_8331 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_8332 = 
torch.constant.int 0 %int0_8333 = torch.constant.int 0 %int9223372036854775807_8334 = torch.constant.int 9223372036854775807 %int1_8335 = torch.constant.int 1 %6435 = torch.aten.slice.Tensor %6172, %int0_8332, %int0_8333, %int9223372036854775807_8334, %int1_8335 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_8336 = torch.constant.int 1 %int0_8337 = torch.constant.int 0 %int1_8338 = torch.constant.int 1 %6436 = torch.aten.slice_scatter %6435, %6434, %int1_8336, %int0_8337, %6415, %int1_8338 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_8339 = torch.constant.int 0 %int0_8340 = torch.constant.int 0 %int9223372036854775807_8341 = torch.constant.int 9223372036854775807 %int1_8342 = torch.constant.int 1 %6437 = torch.aten.slice_scatter %6172, %6436, %int0_8339, %int0_8340, %int9223372036854775807_8341, %int1_8342 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_8343 = torch.constant.int 0 %int0_8344 = torch.constant.int 0 %int9223372036854775807_8345 = torch.constant.int 9223372036854775807 %int1_8346 = torch.constant.int 1 %6438 = torch.aten.slice.Tensor %671, %int0_8343, %int0_8344, %int9223372036854775807_8345, %int1_8346 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_8347 = torch.constant.int 1 %int0_8348 = torch.constant.int 0 %int1_8349 = torch.constant.int 1 %6439 = torch.aten.slice.Tensor %6438, %int1_8347, %int0_8348, %6415, %int1_8349 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int0_8350 = torch.constant.int 0 %int0_8351 = torch.constant.int 0 %int9223372036854775807_8352 = 
torch.constant.int 9223372036854775807 %int1_8353 = torch.constant.int 1 %6440 = torch.aten.slice.Tensor %673, %int0_8350, %int0_8351, %int9223372036854775807_8352, %int1_8353 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_8354 = torch.constant.int 1 %int0_8355 = torch.constant.int 0 %int1_8356 = torch.constant.int 1 %6441 = torch.aten.slice.Tensor %6440, %int1_8354, %int0_8355, %6415, %int1_8356 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_8357 = torch.constant.int 1 %int2_8358 = torch.constant.int 2 %6442 = torch.aten.transpose.int %6278, %int1_8357, %int2_8358 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,1,100],f32> %int4_8359 = torch.constant.int 4 %int32_8360 = torch.constant.int 32 %int1_8361 = torch.constant.int 1 %int100_8362 = torch.constant.int 100 %6443 = torch.prim.ListConstruct %int4_8359, %int32_8360, %int1_8361, %int100_8362 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_8363 = torch.constant.bool false %6444 = torch.aten.expand %6442, %6443, %false_8363 : !torch.vtensor<[4,32,1,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,100],f32> %int128_8364 = torch.constant.int 128 %int1_8365 = torch.constant.int 1 %int100_8366 = torch.constant.int 100 %6445 = torch.prim.ListConstruct %int128_8364, %int1_8365, %int100_8366 : (!torch.int, !torch.int, !torch.int) -> !torch.list %6446 = torch.aten.view %6444, %6445 : !torch.vtensor<[4,32,1,100],f32>, !torch.list -> !torch.vtensor<[128,1,100],f32> %int0_8367 = torch.constant.int 0 %int0_8368 = torch.constant.int 0 %int9223372036854775807_8369 = torch.constant.int 9223372036854775807 %int1_8370 = torch.constant.int 1 %6447 = torch.aten.slice.Tensor %6420, %int0_8367, %int0_8368, %int9223372036854775807_8369, %int1_8370 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, 
!torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_8371 = torch.constant.int 1 %int0_8372 = torch.constant.int 0 %int1_8373 = torch.constant.int 1 %6448 = torch.aten.slice.Tensor %6447, %int1_8371, %int0_8372, %6415, %int1_8373 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_8374 = torch.constant.int 1 %int2_8375 = torch.constant.int 2 %6449 = torch.aten.transpose.int %6448, %int1_8374, %int2_8375 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int2_8376 = torch.constant.int 2 %int3_8377 = torch.constant.int 3 %6450 = torch.aten.transpose.int %6449, %int2_8376, %int3_8377 : !torch.vtensor<[4,32,?,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int1_8378 = torch.constant.int 1 %6451 = torch.aten.size.int %6439, %int1_8378 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_8379 = torch.constant.int 4 %int32_8380 = torch.constant.int 32 %int100_8381 = torch.constant.int 100 %6452 = torch.prim.ListConstruct %int4_8379, %int32_8380, %int100_8381, %6451 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_8382 = torch.constant.bool false %6453 = torch.aten.expand %6450, %6452, %false_8382 : !torch.vtensor<[4,32,100,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,100,?],f32> %int0_8383 = torch.constant.int 0 %6454 = torch.aten.clone %6453, %int0_8383 : !torch.vtensor<[4,32,100,?],f32>, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int128_8384 = torch.constant.int 128 %int100_8385 = torch.constant.int 100 %6455 = torch.prim.ListConstruct %int128_8384, %int100_8385, %6451 : (!torch.int, !torch.int, !torch.int) -> !torch.list %6456 = torch.aten._unsafe_view %6454, %6455 : !torch.vtensor<[4,32,100,?],f32>, !torch.list -> !torch.vtensor<[128,100,?],f32> %6457 = torch.aten.bmm %6446, %6456 : !torch.vtensor<[128,1,100],f32>, 
!torch.vtensor<[128,100,?],f32> -> !torch.vtensor<[128,1,?],f32> %int4_8386 = torch.constant.int 4 %int32_8387 = torch.constant.int 32 %int1_8388 = torch.constant.int 1 %6458 = torch.prim.ListConstruct %int4_8386, %int32_8387, %int1_8388, %6451 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6459 = torch.aten.view %6457, %6458 : !torch.vtensor<[128,1,?],f32>, !torch.list -> !torch.vtensor<[4,32,1,?],f32> %float1.000000e01_8389 = torch.constant.float 1.000000e+01 %6460 = torch.aten.div.Scalar %6459, %float1.000000e01_8389 : !torch.vtensor<[4,32,1,?],f32>, !torch.float -> !torch.vtensor<[4,32,1,?],f32> %int1_8390 = torch.constant.int 1 %6461 = torch.aten.add.Tensor %6460, %895, %int1_8390 : !torch.vtensor<[4,32,1,?],f32>, !torch.vtensor<[4,1,1,?],f32>, !torch.int -> !torch.vtensor<[4,32,1,?],f32> %int-1_8391 = torch.constant.int -1 %false_8392 = torch.constant.bool false %6462 = torch.aten._softmax %6461, %int-1_8391, %false_8392 : !torch.vtensor<[4,32,1,?],f32>, !torch.int, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int4_8393 = torch.constant.int 4 %int32_8394 = torch.constant.int 32 %int1_8395 = torch.constant.int 1 %6463 = torch.prim.ListConstruct %int4_8393, %int32_8394, %int1_8395, %6451 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_8396 = torch.constant.bool false %6464 = torch.aten.expand %6462, %6463, %false_8396 : !torch.vtensor<[4,32,1,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int128_8397 = torch.constant.int 128 %int1_8398 = torch.constant.int 1 %6465 = torch.prim.ListConstruct %int128_8397, %int1_8398, %6451 : (!torch.int, !torch.int, !torch.int) -> !torch.list %6466 = torch.aten.view %6464, %6465 : !torch.vtensor<[4,32,1,?],f32>, !torch.list -> !torch.vtensor<[128,1,?],f32> %int0_8399 = torch.constant.int 0 %int0_8400 = torch.constant.int 0 %int9223372036854775807_8401 = torch.constant.int 9223372036854775807 %int1_8402 = torch.constant.int 1 %6467 = torch.aten.slice.Tensor 
%6437, %int0_8399, %int0_8400, %int9223372036854775807_8401, %int1_8402 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_8403 = torch.constant.int 1 %int0_8404 = torch.constant.int 0 %int1_8405 = torch.constant.int 1 %6468 = torch.aten.slice.Tensor %6467, %int1_8403, %int0_8404, %6415, %int1_8405 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_8406 = torch.constant.int 1 %int2_8407 = torch.constant.int 2 %6469 = torch.aten.transpose.int %6468, %int1_8406, %int2_8407 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int1_8408 = torch.constant.int 1 %6470 = torch.aten.size.int %6441, %int1_8408 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_8409 = torch.constant.int 4 %int32_8410 = torch.constant.int 32 %int100_8411 = torch.constant.int 100 %6471 = torch.prim.ListConstruct %int4_8409, %int32_8410, %6470, %int100_8411 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_8412 = torch.constant.bool false %6472 = torch.aten.expand %6469, %6471, %false_8412 : !torch.vtensor<[4,32,?,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,?,100],f32> %int0_8413 = torch.constant.int 0 %6473 = torch.aten.clone %6472, %int0_8413 : !torch.vtensor<[4,32,?,100],f32>, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int128_8414 = torch.constant.int 128 %int100_8415 = torch.constant.int 100 %6474 = torch.prim.ListConstruct %int128_8414, %6470, %int100_8415 : (!torch.int, !torch.int, !torch.int) -> !torch.list %6475 = torch.aten._unsafe_view %6473, %6474 : !torch.vtensor<[4,32,?,100],f32>, !torch.list -> !torch.vtensor<[128,?,100],f32> %6476 = torch.aten.bmm %6466, %6475 : !torch.vtensor<[128,1,?],f32>, !torch.vtensor<[128,?,100],f32> -> !torch.vtensor<[128,1,100],f32> %int4_8416 = torch.constant.int 4 %int32_8417 = torch.constant.int 
32 %int1_8418 = torch.constant.int 1 %int100_8419 = torch.constant.int 100 %6477 = torch.prim.ListConstruct %int4_8416, %int32_8417, %int1_8418, %int100_8419 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6478 = torch.aten.view %6476, %6477 : !torch.vtensor<[128,1,100],f32>, !torch.list -> !torch.vtensor<[4,32,1,100],f32> %int1_8420 = torch.constant.int 1 %int2_8421 = torch.constant.int 2 %6479 = torch.aten.transpose.int %6478, %int1_8420, %int2_8421 : !torch.vtensor<[4,32,1,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,1,32,100],f32> %int4_8422 = torch.constant.int 4 %int1_8423 = torch.constant.int 1 %int-1_8424 = torch.constant.int -1 %6480 = torch.prim.ListConstruct %int4_8422, %int1_8423, %int-1_8424 : (!torch.int, !torch.int, !torch.int) -> !torch.list %6481 = torch.aten.view %6479, %6480 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,3200],f32> %6482 = torch_c.to_builtin_tensor %6481 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_8425 = tensor.cast %6482 : tensor<4x1x3200xf32> to tensor %6483 = torch_c.to_builtin_tensor %195 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %6484 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_8425, %6483) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_8426 = tensor.cast %6484 : tensor to tensor<4x1x3200xf32> %6485 = torch_c.from_builtin_tensor %cast_8426 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int1_8427 = torch.constant.int 1 %6486 = torch.aten.add.Tensor %6243, %6485, %int1_8427 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_8428 = torch.constant.int 2 %6487 = torch.aten.pow.Tensor_Scalar %6486, %int2_8428 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_8429 = torch.constant.int -1 %6488 = torch.prim.ListConstruct %int-1_8429 : (!torch.int) -> !torch.list %true_8430 = torch.constant.bool true %none_8431 = 
torch.constant.none %6489 = torch.aten.mean.dim %6487, %6488, %true_8430, %none_8431 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_8432 = torch.constant.float 9.9999999747524271E-7 %int1_8433 = torch.constant.int 1 %6490 = torch.aten.add.Scalar %6489, %float9.999990e-07_8432, %int1_8433 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %6491 = torch.aten.rsqrt %6490 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %6492 = torch.aten.mul.Tensor %6486, %6491 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %6493 = torch.aten.mul.Tensor %6492, %196 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %6494 = torch_c.to_builtin_tensor %6493 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_8434 = tensor.cast %6494 : tensor<4x1x3200xf32> to tensor %6495 = torch_c.to_builtin_tensor %197 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %6496 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_8434, %6495) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_8435 = tensor.cast %6496 : tensor to tensor<4x1x8640xf32> %6497 = torch_c.from_builtin_tensor %cast_8435 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %6498 = torch.aten.silu %6497 : !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32> %6499 = torch_c.to_builtin_tensor %6493 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_8436 = tensor.cast %6499 : tensor<4x1x3200xf32> to tensor %6500 = torch_c.to_builtin_tensor %198 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %6501 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_8436, %6500) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_8437 = tensor.cast %6501 : tensor to tensor<4x1x8640xf32> %6502 = torch_c.from_builtin_tensor %cast_8437 : tensor<4x1x8640xf32> -> 
!torch.vtensor<[4,1,8640],f32> %6503 = torch.aten.mul.Tensor %6498, %6502 : !torch.vtensor<[4,1,8640],f32>, !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32> %6504 = torch_c.to_builtin_tensor %6503 : !torch.vtensor<[4,1,8640],f32> -> tensor<4x1x8640xf32> %cast_8438 = tensor.cast %6504 : tensor<4x1x8640xf32> to tensor %6505 = torch_c.to_builtin_tensor %199 : !torch.vtensor<[3200,8640],f16> -> tensor<3200x8640xf16> %6506 = util.call @sharktank_mmtfp_3d_3200_8640_f32f16f32(%cast_8438, %6505) : (tensor, tensor<3200x8640xf16>) -> tensor %cast_8439 = tensor.cast %6506 : tensor to tensor<4x1x3200xf32> %6507 = torch_c.from_builtin_tensor %cast_8439 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int1_8440 = torch.constant.int 1 %6508 = torch.aten.add.Tensor %6486, %6507, %int1_8440 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_8441 = torch.constant.int 2 %6509 = torch.aten.pow.Tensor_Scalar %6508, %int2_8441 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_8442 = torch.constant.int -1 %6510 = torch.prim.ListConstruct %int-1_8442 : (!torch.int) -> !torch.list %true_8443 = torch.constant.bool true %none_8444 = torch.constant.none %6511 = torch.aten.mean.dim %6509, %6510, %true_8443, %none_8444 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_8445 = torch.constant.float 9.9999999747524271E-7 %int1_8446 = torch.constant.int 1 %6512 = torch.aten.add.Scalar %6511, %float9.999990e-07_8445, %int1_8446 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %6513 = torch.aten.rsqrt %6512 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %6514 = torch.aten.mul.Tensor %6508, %6513 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %6515 = torch.aten.mul.Tensor %6514, %200 : 
!torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %6516 = torch_c.to_builtin_tensor %6515 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_8447 = tensor.cast %6516 : tensor<4x1x3200xf32> to tensor %6517 = torch_c.to_builtin_tensor %201 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %6518 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_8447, %6517) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_8448 = tensor.cast %6518 : tensor to tensor<4x1x3200xf32> %6519 = torch_c.from_builtin_tensor %cast_8448 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %6520 = torch_c.to_builtin_tensor %6515 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_8449 = tensor.cast %6520 : tensor<4x1x3200xf32> to tensor %6521 = torch_c.to_builtin_tensor %202 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %6522 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_8449, %6521) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_8450 = tensor.cast %6522 : tensor to tensor<4x1x3200xf32> %6523 = torch_c.from_builtin_tensor %cast_8450 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %6524 = torch_c.to_builtin_tensor %6515 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_8451 = tensor.cast %6524 : tensor<4x1x3200xf32> to tensor %6525 = torch_c.to_builtin_tensor %203 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %6526 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_8451, %6525) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_8452 = tensor.cast %6526 : tensor to tensor<4x1x3200xf32> %6527 = torch_c.from_builtin_tensor %cast_8452 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int4_8453 = torch.constant.int 4 %int1_8454 = torch.constant.int 1 %int32_8455 = torch.constant.int 32 %int100_8456 = torch.constant.int 100 %6528 = torch.prim.ListConstruct %int4_8453, %int1_8454, %int32_8455, %int100_8456 : (!torch.int, !torch.int, 
!torch.int, !torch.int) -> !torch.list %6529 = torch.aten.view %6519, %6528 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_8457 = torch.constant.int 4 %int1_8458 = torch.constant.int 1 %int32_8459 = torch.constant.int 32 %int100_8460 = torch.constant.int 100 %6530 = torch.prim.ListConstruct %int4_8457, %int1_8458, %int32_8459, %int100_8460 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6531 = torch.aten.view %6523, %6530 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_8461 = torch.constant.int 4 %int1_8462 = torch.constant.int 1 %int32_8463 = torch.constant.int 32 %int100_8464 = torch.constant.int 100 %6532 = torch.prim.ListConstruct %int4_8461, %int1_8462, %int32_8463, %int100_8464 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6533 = torch.aten.view %6527, %6532 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_8465 = torch.constant.int 4 %int1_8466 = torch.constant.int 1 %int32_8467 = torch.constant.int 32 %int-1_8468 = torch.constant.int -1 %int2_8469 = torch.constant.int 2 %6534 = torch.prim.ListConstruct %int4_8465, %int1_8466, %int32_8467, %int-1_8468, %int2_8469 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6535 = torch.aten.view %6529, %6534 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %6536 = torch.aten.view_as_complex %6535 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %int4_8470 = torch.constant.int 4 %int1_8471 = torch.constant.int 1 %int32_8472 = torch.constant.int 32 %int-1_8473 = torch.constant.int -1 %int2_8474 = torch.constant.int 2 %6537 = torch.prim.ListConstruct %int4_8470, %int1_8471, %int32_8472, %int-1_8473, %int2_8474 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6538 = torch.aten.view %6531, %6537 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> 
!torch.vtensor<[4,1,32,50,2],f32> %6539 = torch.aten.view_as_complex %6538 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %6540 = torch.aten.mul.Tensor %6536, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %6541 = torch.aten.view_as_real %6540 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_8475 = torch.constant.int 4 %int1_8476 = torch.constant.int 1 %int32_8477 = torch.constant.int 32 %int100_8478 = torch.constant.int 100 %6542 = torch.prim.ListConstruct %int4_8475, %int1_8476, %int32_8477, %int100_8478 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6543 = torch.aten.view %6541, %6542 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %6544 = torch.aten.mul.Tensor %6539, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %6545 = torch.aten.view_as_real %6544 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_8479 = torch.constant.int 4 %int1_8480 = torch.constant.int 1 %int32_8481 = torch.constant.int 32 %int100_8482 = torch.constant.int 100 %6546 = torch.prim.ListConstruct %int4_8479, %int1_8480, %int32_8481, %int100_8482 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6547 = torch.aten.view %6545, %6546 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int1_8483 = torch.constant.int 1 %int1_8484 = torch.constant.int 1 %6548 = torch.aten.add.Scalar %arg2, %int1_8483, %int1_8484 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[4],si64> %int0_8485 = torch.constant.int 0 %int0_8486 = torch.constant.int 0 %6549 = torch.aten.select.int %6548, %int0_8485, %int0_8486 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_8487 = torch.constant.int 0 %int0_8488 = torch.constant.int 0 %6550 
= torch.aten.select.int %arg3, %int0_8487, %int0_8488 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_8489 = torch.constant.int 0 %int0_8490 = torch.constant.int 0 %int9223372036854775807_8491 = torch.constant.int 9223372036854775807 %int1_8492 = torch.constant.int 1 %6551 = torch.aten.slice.Tensor %6550, %int0_8489, %int0_8490, %int9223372036854775807_8491, %int1_8492 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_8493 = torch.constant.int 16 %6552 = torch.aten.floor_divide.Scalar %6549, %int16_8493 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_8494 = torch.constant.int 0 %6553 = torch.aten.index_select %6551, %int0_8494, %6552 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_8495 = torch.constant.int 16 %6554 = torch.aten.remainder.Scalar %6549, %int16_8495 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_8496 = torch.constant.none %6555 = torch.aten.clone %590, %none_8496 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_8497 = torch.constant.none %6556 = torch.aten.clone %591, %none_8497 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_8498 = torch.constant.int 0 %6557 = torch.aten.unsqueeze %6554, %int0_8498 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_8499 = torch.constant.int 0 %int0_8500 = torch.constant.int 0 %6558 = torch.aten.select.int %6547, %int0_8499, %int0_8500 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_8501 = torch.constant.int 0 %int0_8502 = torch.constant.int 0 %6559 = torch.aten.select.int %6558, %int0_8501, %int0_8502 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %int-1_8503 = torch.constant.int -1 %int26_8504 = torch.constant.int 26 %int2_8505 = torch.constant.int 2 
%int16_8506 = torch.constant.int 16 %int32_8507 = torch.constant.int 32 %int100_8508 = torch.constant.int 100 %6560 = torch.prim.ListConstruct %int-1_8503, %int26_8504, %int2_8505, %int16_8506, %int32_8507, %int100_8508 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6561 = torch.aten.view %6395, %6560 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %6562 = torch.prim.ListConstruct %6553, %6555, %6556, %6557 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_8509 = torch.constant.bool false %6563 = torch.aten.index_put %6561, %6562, %6559, %false_8509 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_8510 = torch.constant.int 2662400 %6564 = torch.prim.ListConstruct %731, %int2662400_8510 : (!torch.int, !torch.int) -> !torch.list %6565 = torch.aten.view %6563, %6564 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_8511 = torch.constant.int -1 %int26_8512 = torch.constant.int 26 %int2_8513 = torch.constant.int 2 %int16_8514 = torch.constant.int 16 %int32_8515 = torch.constant.int 32 %int100_8516 = torch.constant.int 100 %6566 = torch.prim.ListConstruct %int-1_8511, %int26_8512, %int2_8513, %int16_8514, %int32_8515, %int100_8516 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6567 = torch.aten.view %6565, %6566 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_8517 = torch.constant.none %6568 = torch.aten.clone %592, %none_8517 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_8518 = torch.constant.none %6569 = torch.aten.clone %593, %none_8518 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_8519 = torch.constant.int 0 %6570 
= torch.aten.unsqueeze %6554, %int0_8519 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_8520 = torch.constant.int 0 %int0_8521 = torch.constant.int 0 %6571 = torch.aten.select.int %6533, %int0_8520, %int0_8521 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_8522 = torch.constant.int 0 %int0_8523 = torch.constant.int 0 %6572 = torch.aten.select.int %6571, %int0_8522, %int0_8523 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %6573 = torch.prim.ListConstruct %6553, %6568, %6569, %6570 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_8524 = torch.constant.bool false %6574 = torch.aten.index_put %6567, %6573, %6572, %false_8524 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_8525 = torch.constant.int 2662400 %6575 = torch.prim.ListConstruct %731, %int2662400_8525 : (!torch.int, !torch.int) -> !torch.list %6576 = torch.aten.view %6574, %6575 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_8526 = torch.constant.int -1 %int26_8527 = torch.constant.int 26 %int2_8528 = torch.constant.int 2 %int16_8529 = torch.constant.int 16 %int32_8530 = torch.constant.int 32 %int100_8531 = torch.constant.int 100 %6577 = torch.prim.ListConstruct %int-1_8526, %int26_8527, %int2_8528, %int16_8529, %int32_8530, %int100_8531 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6578 = torch.aten.view %6576, %6577 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_8532 = torch.constant.int 0 %int1_8533 = torch.constant.int 1 %6579 = torch.aten.select.int %6548, %int0_8532, %int1_8533 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_8534 
= torch.constant.int 0 %int1_8535 = torch.constant.int 1 %6580 = torch.aten.select.int %arg3, %int0_8534, %int1_8535 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_8536 = torch.constant.int 0 %int0_8537 = torch.constant.int 0 %int9223372036854775807_8538 = torch.constant.int 9223372036854775807 %int1_8539 = torch.constant.int 1 %6581 = torch.aten.slice.Tensor %6580, %int0_8536, %int0_8537, %int9223372036854775807_8538, %int1_8539 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_8540 = torch.constant.int 16 %6582 = torch.aten.floor_divide.Scalar %6579, %int16_8540 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_8541 = torch.constant.int 0 %6583 = torch.aten.index_select %6581, %int0_8541, %6582 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_8542 = torch.constant.int 16 %6584 = torch.aten.remainder.Scalar %6579, %int16_8542 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_8543 = torch.constant.none %6585 = torch.aten.clone %594, %none_8543 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_8544 = torch.constant.none %6586 = torch.aten.clone %595, %none_8544 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_8545 = torch.constant.int 0 %6587 = torch.aten.unsqueeze %6584, %int0_8545 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_8546 = torch.constant.int 0 %int1_8547 = torch.constant.int 1 %6588 = torch.aten.select.int %6547, %int0_8546, %int1_8547 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_8548 = torch.constant.int 0 %int0_8549 = torch.constant.int 0 %6589 = torch.aten.select.int %6588, %int0_8548, %int0_8549 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %6590 = torch.prim.ListConstruct %6583, %6585, %6586, 
%6587 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_8550 = torch.constant.bool false %6591 = torch.aten.index_put %6578, %6590, %6589, %false_8550 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_8551 = torch.constant.int 2662400 %6592 = torch.prim.ListConstruct %731, %int2662400_8551 : (!torch.int, !torch.int) -> !torch.list %6593 = torch.aten.view %6591, %6592 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_8552 = torch.constant.int -1 %int26_8553 = torch.constant.int 26 %int2_8554 = torch.constant.int 2 %int16_8555 = torch.constant.int 16 %int32_8556 = torch.constant.int 32 %int100_8557 = torch.constant.int 100 %6594 = torch.prim.ListConstruct %int-1_8552, %int26_8553, %int2_8554, %int16_8555, %int32_8556, %int100_8557 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6595 = torch.aten.view %6593, %6594 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_8558 = torch.constant.none %6596 = torch.aten.clone %596, %none_8558 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_8559 = torch.constant.none %6597 = torch.aten.clone %597, %none_8559 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_8560 = torch.constant.int 0 %6598 = torch.aten.unsqueeze %6584, %int0_8560 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_8561 = torch.constant.int 0 %int1_8562 = torch.constant.int 1 %6599 = torch.aten.select.int %6533, %int0_8561, %int1_8562 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_8563 = torch.constant.int 0 %int0_8564 = torch.constant.int 0 %6600 = torch.aten.select.int %6599, %int0_8563, %int0_8564 : !torch.vtensor<[1,32,100],f32>, 
!torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %6601 = torch.prim.ListConstruct %6583, %6596, %6597, %6598 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_8565 = torch.constant.bool false %6602 = torch.aten.index_put %6595, %6601, %6600, %false_8565 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_8566 = torch.constant.int 2662400 %6603 = torch.prim.ListConstruct %731, %int2662400_8566 : (!torch.int, !torch.int) -> !torch.list %6604 = torch.aten.view %6602, %6603 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_8567 = torch.constant.int -1 %int26_8568 = torch.constant.int 26 %int2_8569 = torch.constant.int 2 %int16_8570 = torch.constant.int 16 %int32_8571 = torch.constant.int 32 %int100_8572 = torch.constant.int 100 %6605 = torch.prim.ListConstruct %int-1_8567, %int26_8568, %int2_8569, %int16_8570, %int32_8571, %int100_8572 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6606 = torch.aten.view %6604, %6605 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_8573 = torch.constant.int 0 %int2_8574 = torch.constant.int 2 %6607 = torch.aten.select.int %6548, %int0_8573, %int2_8574 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_8575 = torch.constant.int 0 %int2_8576 = torch.constant.int 2 %6608 = torch.aten.select.int %arg3, %int0_8575, %int2_8576 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_8577 = torch.constant.int 0 %int0_8578 = torch.constant.int 0 %int9223372036854775807_8579 = torch.constant.int 9223372036854775807 %int1_8580 = torch.constant.int 1 %6609 = torch.aten.slice.Tensor %6608, %int0_8577, %int0_8578, %int9223372036854775807_8579, %int1_8580 : 
!torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_8581 = torch.constant.int 16 %6610 = torch.aten.floor_divide.Scalar %6607, %int16_8581 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_8582 = torch.constant.int 0 %6611 = torch.aten.index_select %6609, %int0_8582, %6610 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_8583 = torch.constant.int 16 %6612 = torch.aten.remainder.Scalar %6607, %int16_8583 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_8584 = torch.constant.none %6613 = torch.aten.clone %598, %none_8584 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_8585 = torch.constant.none %6614 = torch.aten.clone %599, %none_8585 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_8586 = torch.constant.int 0 %6615 = torch.aten.unsqueeze %6612, %int0_8586 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_8587 = torch.constant.int 0 %int2_8588 = torch.constant.int 2 %6616 = torch.aten.select.int %6547, %int0_8587, %int2_8588 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_8589 = torch.constant.int 0 %int0_8590 = torch.constant.int 0 %6617 = torch.aten.select.int %6616, %int0_8589, %int0_8590 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %6618 = torch.prim.ListConstruct %6611, %6613, %6614, %6615 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_8591 = torch.constant.bool false %6619 = torch.aten.index_put %6606, %6618, %6617, %false_8591 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_8592 = torch.constant.int 2662400 %6620 = torch.prim.ListConstruct %731, %int2662400_8592 : 
(!torch.int, !torch.int) -> !torch.list %6621 = torch.aten.view %6619, %6620 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_8593 = torch.constant.int -1 %int26_8594 = torch.constant.int 26 %int2_8595 = torch.constant.int 2 %int16_8596 = torch.constant.int 16 %int32_8597 = torch.constant.int 32 %int100_8598 = torch.constant.int 100 %6622 = torch.prim.ListConstruct %int-1_8593, %int26_8594, %int2_8595, %int16_8596, %int32_8597, %int100_8598 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6623 = torch.aten.view %6621, %6622 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_8599 = torch.constant.none %6624 = torch.aten.clone %600, %none_8599 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_8600 = torch.constant.none %6625 = torch.aten.clone %601, %none_8600 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_8601 = torch.constant.int 0 %6626 = torch.aten.unsqueeze %6612, %int0_8601 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_8602 = torch.constant.int 0 %int2_8603 = torch.constant.int 2 %6627 = torch.aten.select.int %6533, %int0_8602, %int2_8603 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_8604 = torch.constant.int 0 %int0_8605 = torch.constant.int 0 %6628 = torch.aten.select.int %6627, %int0_8604, %int0_8605 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %6629 = torch.prim.ListConstruct %6611, %6624, %6625, %6626 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_8606 = torch.constant.bool false %6630 = torch.aten.index_put %6623, %6629, %6628, %false_8606 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> 
!torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_8607 = torch.constant.int 2662400 %6631 = torch.prim.ListConstruct %731, %int2662400_8607 : (!torch.int, !torch.int) -> !torch.list %6632 = torch.aten.view %6630, %6631 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_8608 = torch.constant.int -1 %int26_8609 = torch.constant.int 26 %int2_8610 = torch.constant.int 2 %int16_8611 = torch.constant.int 16 %int32_8612 = torch.constant.int 32 %int100_8613 = torch.constant.int 100 %6633 = torch.prim.ListConstruct %int-1_8608, %int26_8609, %int2_8610, %int16_8611, %int32_8612, %int100_8613 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6634 = torch.aten.view %6632, %6633 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_8614 = torch.constant.int 0 %int3_8615 = torch.constant.int 3 %6635 = torch.aten.select.int %6548, %int0_8614, %int3_8615 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_8616 = torch.constant.int 0 %int3_8617 = torch.constant.int 3 %6636 = torch.aten.select.int %arg3, %int0_8616, %int3_8617 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_8618 = torch.constant.int 0 %int0_8619 = torch.constant.int 0 %int9223372036854775807_8620 = torch.constant.int 9223372036854775807 %int1_8621 = torch.constant.int 1 %6637 = torch.aten.slice.Tensor %6636, %int0_8618, %int0_8619, %int9223372036854775807_8620, %int1_8621 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_8622 = torch.constant.int 16 %6638 = torch.aten.floor_divide.Scalar %6635, %int16_8622 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_8623 = torch.constant.int 0 %6639 = torch.aten.index_select %6637, %int0_8623, %6638 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_8624 
= torch.constant.int 16 %6640 = torch.aten.remainder.Scalar %6635, %int16_8624 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_8625 = torch.constant.none %6641 = torch.aten.clone %602, %none_8625 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_8626 = torch.constant.none %6642 = torch.aten.clone %603, %none_8626 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_8627 = torch.constant.int 0 %6643 = torch.aten.unsqueeze %6640, %int0_8627 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_8628 = torch.constant.int 0 %int3_8629 = torch.constant.int 3 %6644 = torch.aten.select.int %6547, %int0_8628, %int3_8629 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_8630 = torch.constant.int 0 %int0_8631 = torch.constant.int 0 %6645 = torch.aten.select.int %6644, %int0_8630, %int0_8631 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %6646 = torch.prim.ListConstruct %6639, %6641, %6642, %6643 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_8632 = torch.constant.bool false %6647 = torch.aten.index_put %6634, %6646, %6645, %false_8632 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_8633 = torch.constant.int 2662400 %6648 = torch.prim.ListConstruct %731, %int2662400_8633 : (!torch.int, !torch.int) -> !torch.list %6649 = torch.aten.view %6647, %6648 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_8634 = torch.constant.int -1 %int26_8635 = torch.constant.int 26 %int2_8636 = torch.constant.int 2 %int16_8637 = torch.constant.int 16 %int32_8638 = torch.constant.int 32 %int100_8639 = torch.constant.int 100 %6650 = torch.prim.ListConstruct %int-1_8634, %int26_8635, %int2_8636, 
%int16_8637, %int32_8638, %int100_8639 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6651 = torch.aten.view %6649, %6650 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_8640 = torch.constant.none %6652 = torch.aten.clone %604, %none_8640 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_8641 = torch.constant.none %6653 = torch.aten.clone %605, %none_8641 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_8642 = torch.constant.int 0 %6654 = torch.aten.unsqueeze %6640, %int0_8642 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_8643 = torch.constant.int 0 %int3_8644 = torch.constant.int 3 %6655 = torch.aten.select.int %6533, %int0_8643, %int3_8644 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_8645 = torch.constant.int 0 %int0_8646 = torch.constant.int 0 %6656 = torch.aten.select.int %6655, %int0_8645, %int0_8646 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %6657 = torch.prim.ListConstruct %6639, %6652, %6653, %6654 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_8647 = torch.constant.bool false %6658 = torch.aten.index_put %6651, %6657, %6656, %false_8647 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_8648 = torch.constant.int 2662400 %6659 = torch.prim.ListConstruct %731, %int2662400_8648 : (!torch.int, !torch.int) -> !torch.list %6660 = torch.aten.view %6658, %6659 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int52_8649 = torch.constant.int 52 %6661 = torch.aten.mul.Scalar %arg3, %int52_8649 : !torch.vtensor<[4,?],si64>, !torch.int -> !torch.vtensor<[4,?],si64> %int44 = 
torch.constant.int 44 %int1_8650 = torch.constant.int 1 %6662 = torch.aten.add.Scalar %6661, %int44, %int1_8650 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_8651 = torch.constant.int 4 %6663 = torch.aten.mul.int %int4_8651, %655 : !torch.int, !torch.int -> !torch.int %6664 = torch.prim.ListConstruct %6663 : (!torch.int) -> !torch.list %6665 = torch.aten.view %6662, %6664 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int-1_8652 = torch.constant.int -1 %int26_8653 = torch.constant.int 26 %int2_8654 = torch.constant.int 2 %int16_8655 = torch.constant.int 16 %int32_8656 = torch.constant.int 32 %int100_8657 = torch.constant.int 100 %6666 = torch.prim.ListConstruct %int-1_8652, %int26_8653, %int2_8654, %int16_8655, %int32_8656, %int100_8657 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6667 = torch.aten.view %6660, %6666 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int26_8658 = torch.constant.int 26 %6668 = torch.aten.mul.int %731, %int26_8658 : !torch.int, !torch.int -> !torch.int %int2_8659 = torch.constant.int 2 %6669 = torch.aten.mul.int %6668, %int2_8659 : !torch.int, !torch.int -> !torch.int %int16_8660 = torch.constant.int 16 %int32_8661 = torch.constant.int 32 %int100_8662 = torch.constant.int 100 %6670 = torch.prim.ListConstruct %6669, %int16_8660, %int32_8661, %int100_8662 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6671 = torch.aten.view %6667, %6670 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,16,32,100],f32> %int0_8663 = torch.constant.int 0 %6672 = torch.aten.index_select %6671, %int0_8663, %6665 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_8664 = torch.constant.int 4 %int16_8665 = torch.constant.int 16 %int32_8666 = torch.constant.int 32 %int100_8667 = torch.constant.int 100 
%6673 = torch.prim.ListConstruct %int4_8664, %655, %int16_8665, %int32_8666, %int100_8667 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6674 = torch.aten.view %6672, %6673 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_8668 = torch.constant.int 1 %6675 = torch.aten.size.int %6674, %int1_8668 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_8669 = torch.constant.int 16 %6676 = torch.aten.mul.int %6675, %int16_8669 : !torch.int, !torch.int -> !torch.int %int4_8670 = torch.constant.int 4 %int32_8671 = torch.constant.int 32 %int100_8672 = torch.constant.int 100 %6677 = torch.prim.ListConstruct %int4_8670, %6676, %int32_8671, %int100_8672 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6678 = torch.aten.view %6674, %6677 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_8673 = torch.constant.int 0 %int0_8674 = torch.constant.int 0 %int9223372036854775807_8675 = torch.constant.int 9223372036854775807 %int1_8676 = torch.constant.int 1 %6679 = torch.aten.slice.Tensor %6420, %int0_8673, %int0_8674, %int9223372036854775807_8675, %int1_8676 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int16_8677 = torch.constant.int 16 %6680 = torch.aten.mul.int %655, %int16_8677 : !torch.int, !torch.int -> !torch.int %int1_8678 = torch.constant.int 1 %int0_8679 = torch.constant.int 0 %int1_8680 = torch.constant.int 1 %6681 = torch.aten.slice.Tensor %6679, %int1_8678, %int0_8679, %6680, %int1_8680 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_8681 = torch.constant.bool false %6682 = torch.aten.copy %6681, %6678, %false_8681 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_8682 = torch.constant.int 
0 %int0_8683 = torch.constant.int 0 %int9223372036854775807_8684 = torch.constant.int 9223372036854775807 %int1_8685 = torch.constant.int 1 %6683 = torch.aten.slice.Tensor %6420, %int0_8682, %int0_8683, %int9223372036854775807_8684, %int1_8685 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_8686 = torch.constant.int 1 %int0_8687 = torch.constant.int 0 %int1_8688 = torch.constant.int 1 %6684 = torch.aten.slice_scatter %6683, %6682, %int1_8686, %int0_8687, %6680, %int1_8688 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_8689 = torch.constant.int 0 %int0_8690 = torch.constant.int 0 %int9223372036854775807_8691 = torch.constant.int 9223372036854775807 %int1_8692 = torch.constant.int 1 %6685 = torch.aten.slice_scatter %6420, %6684, %int0_8689, %int0_8690, %int9223372036854775807_8691, %int1_8692 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_8693 = torch.constant.int 1 %int1_8694 = torch.constant.int 1 %6686 = torch.aten.add.Scalar %6662, %int1_8693, %int1_8694 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_8695 = torch.constant.int 4 %6687 = torch.aten.mul.int %int4_8695, %655 : !torch.int, !torch.int -> !torch.int %6688 = torch.prim.ListConstruct %6687 : (!torch.int) -> !torch.list %6689 = torch.aten.view %6686, %6688 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int0_8696 = torch.constant.int 0 %6690 = torch.aten.index_select %6671, %int0_8696, %6689 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_8697 = torch.constant.int 4 %int16_8698 = torch.constant.int 16 %int32_8699 = torch.constant.int 32 %int100_8700 = 
torch.constant.int 100 %6691 = torch.prim.ListConstruct %int4_8697, %655, %int16_8698, %int32_8699, %int100_8700 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6692 = torch.aten.view %6690, %6691 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_8701 = torch.constant.int 1 %6693 = torch.aten.size.int %6692, %int1_8701 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_8702 = torch.constant.int 16 %6694 = torch.aten.mul.int %6693, %int16_8702 : !torch.int, !torch.int -> !torch.int %int4_8703 = torch.constant.int 4 %int32_8704 = torch.constant.int 32 %int100_8705 = torch.constant.int 100 %6695 = torch.prim.ListConstruct %int4_8703, %6694, %int32_8704, %int100_8705 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6696 = torch.aten.view %6692, %6695 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_8706 = torch.constant.int 0 %int0_8707 = torch.constant.int 0 %int9223372036854775807_8708 = torch.constant.int 9223372036854775807 %int1_8709 = torch.constant.int 1 %6697 = torch.aten.slice.Tensor %6437, %int0_8706, %int0_8707, %int9223372036854775807_8708, %int1_8709 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_8710 = torch.constant.int 1 %int0_8711 = torch.constant.int 0 %int1_8712 = torch.constant.int 1 %6698 = torch.aten.slice.Tensor %6697, %int1_8710, %int0_8711, %6680, %int1_8712 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_8713 = torch.constant.bool false %6699 = torch.aten.copy %6698, %6696, %false_8713 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_8714 = torch.constant.int 0 %int0_8715 = torch.constant.int 0 %int9223372036854775807_8716 = torch.constant.int 
9223372036854775807 %int1_8717 = torch.constant.int 1 %6700 = torch.aten.slice.Tensor %6437, %int0_8714, %int0_8715, %int9223372036854775807_8716, %int1_8717 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_8718 = torch.constant.int 1 %int0_8719 = torch.constant.int 0 %int1_8720 = torch.constant.int 1 %6701 = torch.aten.slice_scatter %6700, %6699, %int1_8718, %int0_8719, %6680, %int1_8720 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_8721 = torch.constant.int 0 %int0_8722 = torch.constant.int 0 %int9223372036854775807_8723 = torch.constant.int 9223372036854775807 %int1_8724 = torch.constant.int 1 %6702 = torch.aten.slice_scatter %6437, %6701, %int0_8721, %int0_8722, %int9223372036854775807_8723, %int1_8724 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_8725 = torch.constant.int 0 %int0_8726 = torch.constant.int 0 %int9223372036854775807_8727 = torch.constant.int 9223372036854775807 %int1_8728 = torch.constant.int 1 %6703 = torch.aten.slice.Tensor %671, %int0_8725, %int0_8726, %int9223372036854775807_8727, %int1_8728 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_8729 = torch.constant.int 1 %int0_8730 = torch.constant.int 0 %int1_8731 = torch.constant.int 1 %6704 = torch.aten.slice.Tensor %6703, %int1_8729, %int0_8730, %6680, %int1_8731 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int0_8732 = torch.constant.int 0 %int0_8733 = torch.constant.int 0 %int9223372036854775807_8734 = torch.constant.int 9223372036854775807 %int1_8735 = torch.constant.int 1 %6705 = torch.aten.slice.Tensor %673, 
%int0_8732, %int0_8733, %int9223372036854775807_8734, %int1_8735 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_8736 = torch.constant.int 1 %int0_8737 = torch.constant.int 0 %int1_8738 = torch.constant.int 1 %6706 = torch.aten.slice.Tensor %6705, %int1_8736, %int0_8737, %6680, %int1_8738 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_8739 = torch.constant.int 1 %int2_8740 = torch.constant.int 2 %6707 = torch.aten.transpose.int %6543, %int1_8739, %int2_8740 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,1,100],f32> %int4_8741 = torch.constant.int 4 %int32_8742 = torch.constant.int 32 %int1_8743 = torch.constant.int 1 %int100_8744 = torch.constant.int 100 %6708 = torch.prim.ListConstruct %int4_8741, %int32_8742, %int1_8743, %int100_8744 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_8745 = torch.constant.bool false %6709 = torch.aten.expand %6707, %6708, %false_8745 : !torch.vtensor<[4,32,1,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,100],f32> %int128_8746 = torch.constant.int 128 %int1_8747 = torch.constant.int 1 %int100_8748 = torch.constant.int 100 %6710 = torch.prim.ListConstruct %int128_8746, %int1_8747, %int100_8748 : (!torch.int, !torch.int, !torch.int) -> !torch.list %6711 = torch.aten.view %6709, %6710 : !torch.vtensor<[4,32,1,100],f32>, !torch.list -> !torch.vtensor<[128,1,100],f32> %int0_8749 = torch.constant.int 0 %int0_8750 = torch.constant.int 0 %int9223372036854775807_8751 = torch.constant.int 9223372036854775807 %int1_8752 = torch.constant.int 1 %6712 = torch.aten.slice.Tensor %6685, %int0_8749, %int0_8750, %int9223372036854775807_8751, %int1_8752 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_8753 = torch.constant.int 1 
%int0_8754 = torch.constant.int 0 %int1_8755 = torch.constant.int 1 %6713 = torch.aten.slice.Tensor %6712, %int1_8753, %int0_8754, %6680, %int1_8755 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_8756 = torch.constant.int 1 %int2_8757 = torch.constant.int 2 %6714 = torch.aten.transpose.int %6713, %int1_8756, %int2_8757 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int2_8758 = torch.constant.int 2 %int3_8759 = torch.constant.int 3 %6715 = torch.aten.transpose.int %6714, %int2_8758, %int3_8759 : !torch.vtensor<[4,32,?,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int1_8760 = torch.constant.int 1 %6716 = torch.aten.size.int %6704, %int1_8760 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_8761 = torch.constant.int 4 %int32_8762 = torch.constant.int 32 %int100_8763 = torch.constant.int 100 %6717 = torch.prim.ListConstruct %int4_8761, %int32_8762, %int100_8763, %6716 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_8764 = torch.constant.bool false %6718 = torch.aten.expand %6715, %6717, %false_8764 : !torch.vtensor<[4,32,100,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,100,?],f32> %int0_8765 = torch.constant.int 0 %6719 = torch.aten.clone %6718, %int0_8765 : !torch.vtensor<[4,32,100,?],f32>, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int128_8766 = torch.constant.int 128 %int100_8767 = torch.constant.int 100 %6720 = torch.prim.ListConstruct %int128_8766, %int100_8767, %6716 : (!torch.int, !torch.int, !torch.int) -> !torch.list %6721 = torch.aten._unsafe_view %6719, %6720 : !torch.vtensor<[4,32,100,?],f32>, !torch.list -> !torch.vtensor<[128,100,?],f32> %6722 = torch.aten.bmm %6711, %6721 : !torch.vtensor<[128,1,100],f32>, !torch.vtensor<[128,100,?],f32> -> !torch.vtensor<[128,1,?],f32> %int4_8768 = torch.constant.int 4 %int32_8769 = torch.constant.int 32 
%int1_8770 = torch.constant.int 1 %6723 = torch.prim.ListConstruct %int4_8768, %int32_8769, %int1_8770, %6716 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6724 = torch.aten.view %6722, %6723 : !torch.vtensor<[128,1,?],f32>, !torch.list -> !torch.vtensor<[4,32,1,?],f32> %float1.000000e01_8771 = torch.constant.float 1.000000e+01 %6725 = torch.aten.div.Scalar %6724, %float1.000000e01_8771 : !torch.vtensor<[4,32,1,?],f32>, !torch.float -> !torch.vtensor<[4,32,1,?],f32> %int1_8772 = torch.constant.int 1 %6726 = torch.aten.add.Tensor %6725, %895, %int1_8772 : !torch.vtensor<[4,32,1,?],f32>, !torch.vtensor<[4,1,1,?],f32>, !torch.int -> !torch.vtensor<[4,32,1,?],f32> %int-1_8773 = torch.constant.int -1 %false_8774 = torch.constant.bool false %6727 = torch.aten._softmax %6726, %int-1_8773, %false_8774 : !torch.vtensor<[4,32,1,?],f32>, !torch.int, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int4_8775 = torch.constant.int 4 %int32_8776 = torch.constant.int 32 %int1_8777 = torch.constant.int 1 %6728 = torch.prim.ListConstruct %int4_8775, %int32_8776, %int1_8777, %6716 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_8778 = torch.constant.bool false %6729 = torch.aten.expand %6727, %6728, %false_8778 : !torch.vtensor<[4,32,1,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int128_8779 = torch.constant.int 128 %int1_8780 = torch.constant.int 1 %6730 = torch.prim.ListConstruct %int128_8779, %int1_8780, %6716 : (!torch.int, !torch.int, !torch.int) -> !torch.list %6731 = torch.aten.view %6729, %6730 : !torch.vtensor<[4,32,1,?],f32>, !torch.list -> !torch.vtensor<[128,1,?],f32> %int0_8781 = torch.constant.int 0 %int0_8782 = torch.constant.int 0 %int9223372036854775807_8783 = torch.constant.int 9223372036854775807 %int1_8784 = torch.constant.int 1 %6732 = torch.aten.slice.Tensor %6702, %int0_8781, %int0_8782, %int9223372036854775807_8783, %int1_8784 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, 
!torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_8785 = torch.constant.int 1 %int0_8786 = torch.constant.int 0 %int1_8787 = torch.constant.int 1 %6733 = torch.aten.slice.Tensor %6732, %int1_8785, %int0_8786, %6680, %int1_8787 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_8788 = torch.constant.int 1 %int2_8789 = torch.constant.int 2 %6734 = torch.aten.transpose.int %6733, %int1_8788, %int2_8789 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int1_8790 = torch.constant.int 1 %6735 = torch.aten.size.int %6706, %int1_8790 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_8791 = torch.constant.int 4 %int32_8792 = torch.constant.int 32 %int100_8793 = torch.constant.int 100 %6736 = torch.prim.ListConstruct %int4_8791, %int32_8792, %6735, %int100_8793 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_8794 = torch.constant.bool false %6737 = torch.aten.expand %6734, %6736, %false_8794 : !torch.vtensor<[4,32,?,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,?,100],f32> %int0_8795 = torch.constant.int 0 %6738 = torch.aten.clone %6737, %int0_8795 : !torch.vtensor<[4,32,?,100],f32>, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int128_8796 = torch.constant.int 128 %int100_8797 = torch.constant.int 100 %6739 = torch.prim.ListConstruct %int128_8796, %6735, %int100_8797 : (!torch.int, !torch.int, !torch.int) -> !torch.list %6740 = torch.aten._unsafe_view %6738, %6739 : !torch.vtensor<[4,32,?,100],f32>, !torch.list -> !torch.vtensor<[128,?,100],f32> %6741 = torch.aten.bmm %6731, %6740 : !torch.vtensor<[128,1,?],f32>, !torch.vtensor<[128,?,100],f32> -> !torch.vtensor<[128,1,100],f32> %int4_8798 = torch.constant.int 4 %int32_8799 = torch.constant.int 32 %int1_8800 = torch.constant.int 1 %int100_8801 = torch.constant.int 100 %6742 = torch.prim.ListConstruct %int4_8798, %int32_8799, 
%int1_8800, %int100_8801 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6743 = torch.aten.view %6741, %6742 : !torch.vtensor<[128,1,100],f32>, !torch.list -> !torch.vtensor<[4,32,1,100],f32> %int1_8802 = torch.constant.int 1 %int2_8803 = torch.constant.int 2 %6744 = torch.aten.transpose.int %6743, %int1_8802, %int2_8803 : !torch.vtensor<[4,32,1,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,1,32,100],f32> %int4_8804 = torch.constant.int 4 %int1_8805 = torch.constant.int 1 %int-1_8806 = torch.constant.int -1 %6745 = torch.prim.ListConstruct %int4_8804, %int1_8805, %int-1_8806 : (!torch.int, !torch.int, !torch.int) -> !torch.list %6746 = torch.aten.view %6744, %6745 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,3200],f32> %6747 = torch_c.to_builtin_tensor %6746 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_8807 = tensor.cast %6747 : tensor<4x1x3200xf32> to tensor %6748 = torch_c.to_builtin_tensor %204 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %6749 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_8807, %6748) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_8808 = tensor.cast %6749 : tensor to tensor<4x1x3200xf32> %6750 = torch_c.from_builtin_tensor %cast_8808 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int1_8809 = torch.constant.int 1 %6751 = torch.aten.add.Tensor %6508, %6750, %int1_8809 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_8810 = torch.constant.int 2 %6752 = torch.aten.pow.Tensor_Scalar %6751, %int2_8810 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_8811 = torch.constant.int -1 %6753 = torch.prim.ListConstruct %int-1_8811 : (!torch.int) -> !torch.list %true_8812 = torch.constant.bool true %none_8813 = torch.constant.none %6754 = torch.aten.mean.dim %6752, %6753, %true_8812, %none_8813 : !torch.vtensor<[4,1,3200],f32>, !torch.list, 
!torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_8814 = torch.constant.float 9.9999999747524271E-7 %int1_8815 = torch.constant.int 1 %6755 = torch.aten.add.Scalar %6754, %float9.999990e-07_8814, %int1_8815 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %6756 = torch.aten.rsqrt %6755 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %6757 = torch.aten.mul.Tensor %6751, %6756 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %6758 = torch.aten.mul.Tensor %6757, %205 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %6759 = torch_c.to_builtin_tensor %6758 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_8816 = tensor.cast %6759 : tensor<4x1x3200xf32> to tensor %6760 = torch_c.to_builtin_tensor %206 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %6761 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_8816, %6760) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_8817 = tensor.cast %6761 : tensor to tensor<4x1x8640xf32> %6762 = torch_c.from_builtin_tensor %cast_8817 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %6763 = torch.aten.silu %6762 : !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32> %6764 = torch_c.to_builtin_tensor %6758 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_8818 = tensor.cast %6764 : tensor<4x1x3200xf32> to tensor %6765 = torch_c.to_builtin_tensor %207 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %6766 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_8818, %6765) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_8819 = tensor.cast %6766 : tensor to tensor<4x1x8640xf32> %6767 = torch_c.from_builtin_tensor %cast_8819 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %6768 = torch.aten.mul.Tensor %6763, %6767 : !torch.vtensor<[4,1,8640],f32>, !torch.vtensor<[4,1,8640],f32> -> 
!torch.vtensor<[4,1,8640],f32> %6769 = torch_c.to_builtin_tensor %6768 : !torch.vtensor<[4,1,8640],f32> -> tensor<4x1x8640xf32> %cast_8820 = tensor.cast %6769 : tensor<4x1x8640xf32> to tensor %6770 = torch_c.to_builtin_tensor %208 : !torch.vtensor<[3200,8640],f16> -> tensor<3200x8640xf16> %6771 = util.call @sharktank_mmtfp_3d_3200_8640_f32f16f32(%cast_8820, %6770) : (tensor, tensor<3200x8640xf16>) -> tensor %cast_8821 = tensor.cast %6771 : tensor to tensor<4x1x3200xf32> %6772 = torch_c.from_builtin_tensor %cast_8821 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int1_8822 = torch.constant.int 1 %6773 = torch.aten.add.Tensor %6751, %6772, %int1_8822 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_8823 = torch.constant.int 2 %6774 = torch.aten.pow.Tensor_Scalar %6773, %int2_8823 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_8824 = torch.constant.int -1 %6775 = torch.prim.ListConstruct %int-1_8824 : (!torch.int) -> !torch.list %true_8825 = torch.constant.bool true %none_8826 = torch.constant.none %6776 = torch.aten.mean.dim %6774, %6775, %true_8825, %none_8826 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_8827 = torch.constant.float 9.9999999747524271E-7 %int1_8828 = torch.constant.int 1 %6777 = torch.aten.add.Scalar %6776, %float9.999990e-07_8827, %int1_8828 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %6778 = torch.aten.rsqrt %6777 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %6779 = torch.aten.mul.Tensor %6773, %6778 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %6780 = torch.aten.mul.Tensor %6779, %209 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %6781 = torch_c.to_builtin_tensor %6780 : 
!torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_8829 = tensor.cast %6781 : tensor<4x1x3200xf32> to tensor %6782 = torch_c.to_builtin_tensor %210 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %6783 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_8829, %6782) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_8830 = tensor.cast %6783 : tensor to tensor<4x1x3200xf32> %6784 = torch_c.from_builtin_tensor %cast_8830 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %6785 = torch_c.to_builtin_tensor %6780 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_8831 = tensor.cast %6785 : tensor<4x1x3200xf32> to tensor %6786 = torch_c.to_builtin_tensor %211 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %6787 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_8831, %6786) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_8832 = tensor.cast %6787 : tensor to tensor<4x1x3200xf32> %6788 = torch_c.from_builtin_tensor %cast_8832 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %6789 = torch_c.to_builtin_tensor %6780 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_8833 = tensor.cast %6789 : tensor<4x1x3200xf32> to tensor %6790 = torch_c.to_builtin_tensor %212 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %6791 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_8833, %6790) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_8834 = tensor.cast %6791 : tensor to tensor<4x1x3200xf32> %6792 = torch_c.from_builtin_tensor %cast_8834 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int4_8835 = torch.constant.int 4 %int1_8836 = torch.constant.int 1 %int32_8837 = torch.constant.int 32 %int100_8838 = torch.constant.int 100 %6793 = torch.prim.ListConstruct %int4_8835, %int1_8836, %int32_8837, %int100_8838 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6794 = torch.aten.view %6784, %6793 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> 
!torch.vtensor<[4,1,32,100],f32> %int4_8839 = torch.constant.int 4 %int1_8840 = torch.constant.int 1 %int32_8841 = torch.constant.int 32 %int100_8842 = torch.constant.int 100 %6795 = torch.prim.ListConstruct %int4_8839, %int1_8840, %int32_8841, %int100_8842 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6796 = torch.aten.view %6788, %6795 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_8843 = torch.constant.int 4 %int1_8844 = torch.constant.int 1 %int32_8845 = torch.constant.int 32 %int100_8846 = torch.constant.int 100 %6797 = torch.prim.ListConstruct %int4_8843, %int1_8844, %int32_8845, %int100_8846 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6798 = torch.aten.view %6792, %6797 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_8847 = torch.constant.int 4 %int1_8848 = torch.constant.int 1 %int32_8849 = torch.constant.int 32 %int-1_8850 = torch.constant.int -1 %int2_8851 = torch.constant.int 2 %6799 = torch.prim.ListConstruct %int4_8847, %int1_8848, %int32_8849, %int-1_8850, %int2_8851 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6800 = torch.aten.view %6794, %6799 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %6801 = torch.aten.view_as_complex %6800 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %int4_8852 = torch.constant.int 4 %int1_8853 = torch.constant.int 1 %int32_8854 = torch.constant.int 32 %int-1_8855 = torch.constant.int -1 %int2_8856 = torch.constant.int 2 %6802 = torch.prim.ListConstruct %int4_8852, %int1_8853, %int32_8854, %int-1_8855, %int2_8856 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6803 = torch.aten.view %6796, %6802 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %6804 = torch.aten.view_as_complex %6803 : !torch.vtensor<[4,1,32,50,2],f32> -> 
!torch.vtensor<[4,1,32,50],complex> %6805 = torch.aten.mul.Tensor %6801, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %6806 = torch.aten.view_as_real %6805 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_8857 = torch.constant.int 4 %int1_8858 = torch.constant.int 1 %int32_8859 = torch.constant.int 32 %int100_8860 = torch.constant.int 100 %6807 = torch.prim.ListConstruct %int4_8857, %int1_8858, %int32_8859, %int100_8860 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6808 = torch.aten.view %6806, %6807 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %6809 = torch.aten.mul.Tensor %6804, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %6810 = torch.aten.view_as_real %6809 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_8861 = torch.constant.int 4 %int1_8862 = torch.constant.int 1 %int32_8863 = torch.constant.int 32 %int100_8864 = torch.constant.int 100 %6811 = torch.prim.ListConstruct %int4_8861, %int1_8862, %int32_8863, %int100_8864 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6812 = torch.aten.view %6810, %6811 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int1_8865 = torch.constant.int 1 %int1_8866 = torch.constant.int 1 %6813 = torch.aten.add.Scalar %arg2, %int1_8865, %int1_8866 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[4],si64> %int0_8867 = torch.constant.int 0 %int0_8868 = torch.constant.int 0 %6814 = torch.aten.select.int %6813, %int0_8867, %int0_8868 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_8869 = torch.constant.int 0 %int0_8870 = torch.constant.int 0 %6815 = torch.aten.select.int %arg3, %int0_8869, %int0_8870 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> 
!torch.vtensor<[?],si64> %int0_8871 = torch.constant.int 0 %int0_8872 = torch.constant.int 0 %int9223372036854775807_8873 = torch.constant.int 9223372036854775807 %int1_8874 = torch.constant.int 1 %6816 = torch.aten.slice.Tensor %6815, %int0_8871, %int0_8872, %int9223372036854775807_8873, %int1_8874 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_8875 = torch.constant.int 16 %6817 = torch.aten.floor_divide.Scalar %6814, %int16_8875 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_8876 = torch.constant.int 0 %6818 = torch.aten.index_select %6816, %int0_8876, %6817 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_8877 = torch.constant.int 16 %6819 = torch.aten.remainder.Scalar %6814, %int16_8877 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_8878 = torch.constant.none %6820 = torch.aten.clone %606, %none_8878 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_8879 = torch.constant.none %6821 = torch.aten.clone %607, %none_8879 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_8880 = torch.constant.int 0 %6822 = torch.aten.unsqueeze %6819, %int0_8880 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_8881 = torch.constant.int 0 %int0_8882 = torch.constant.int 0 %6823 = torch.aten.select.int %6812, %int0_8881, %int0_8882 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_8883 = torch.constant.int 0 %int0_8884 = torch.constant.int 0 %6824 = torch.aten.select.int %6823, %int0_8883, %int0_8884 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %int-1_8885 = torch.constant.int -1 %int26_8886 = torch.constant.int 26 %int2_8887 = torch.constant.int 2 %int16_8888 = torch.constant.int 16 %int32_8889 = torch.constant.int 32 %int100_8890 = torch.constant.int 100 %6825 = 
torch.prim.ListConstruct %int-1_8885, %int26_8886, %int2_8887, %int16_8888, %int32_8889, %int100_8890 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6826 = torch.aten.view %6660, %6825 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %6827 = torch.prim.ListConstruct %6818, %6820, %6821, %6822 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_8891 = torch.constant.bool false %6828 = torch.aten.index_put %6826, %6827, %6824, %false_8891 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_8892 = torch.constant.int 2662400 %6829 = torch.prim.ListConstruct %731, %int2662400_8892 : (!torch.int, !torch.int) -> !torch.list %6830 = torch.aten.view %6828, %6829 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_8893 = torch.constant.int -1 %int26_8894 = torch.constant.int 26 %int2_8895 = torch.constant.int 2 %int16_8896 = torch.constant.int 16 %int32_8897 = torch.constant.int 32 %int100_8898 = torch.constant.int 100 %6831 = torch.prim.ListConstruct %int-1_8893, %int26_8894, %int2_8895, %int16_8896, %int32_8897, %int100_8898 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6832 = torch.aten.view %6830, %6831 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_8899 = torch.constant.none %6833 = torch.aten.clone %608, %none_8899 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_8900 = torch.constant.none %6834 = torch.aten.clone %609, %none_8900 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_8901 = torch.constant.int 0 %6835 = torch.aten.unsqueeze %6819, %int0_8901 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_8902 
= torch.constant.int 0 %int0_8903 = torch.constant.int 0 %6836 = torch.aten.select.int %6798, %int0_8902, %int0_8903 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_8904 = torch.constant.int 0 %int0_8905 = torch.constant.int 0 %6837 = torch.aten.select.int %6836, %int0_8904, %int0_8905 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %6838 = torch.prim.ListConstruct %6818, %6833, %6834, %6835 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_8906 = torch.constant.bool false %6839 = torch.aten.index_put %6832, %6838, %6837, %false_8906 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_8907 = torch.constant.int 2662400 %6840 = torch.prim.ListConstruct %731, %int2662400_8907 : (!torch.int, !torch.int) -> !torch.list %6841 = torch.aten.view %6839, %6840 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_8908 = torch.constant.int -1 %int26_8909 = torch.constant.int 26 %int2_8910 = torch.constant.int 2 %int16_8911 = torch.constant.int 16 %int32_8912 = torch.constant.int 32 %int100_8913 = torch.constant.int 100 %6842 = torch.prim.ListConstruct %int-1_8908, %int26_8909, %int2_8910, %int16_8911, %int32_8912, %int100_8913 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6843 = torch.aten.view %6841, %6842 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_8914 = torch.constant.int 0 %int1_8915 = torch.constant.int 1 %6844 = torch.aten.select.int %6813, %int0_8914, %int1_8915 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_8916 = torch.constant.int 0 %int1_8917 = torch.constant.int 1 %6845 = torch.aten.select.int %arg3, %int0_8916, %int1_8917 : 
!torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_8918 = torch.constant.int 0 %int0_8919 = torch.constant.int 0 %int9223372036854775807_8920 = torch.constant.int 9223372036854775807 %int1_8921 = torch.constant.int 1 %6846 = torch.aten.slice.Tensor %6845, %int0_8918, %int0_8919, %int9223372036854775807_8920, %int1_8921 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_8922 = torch.constant.int 16 %6847 = torch.aten.floor_divide.Scalar %6844, %int16_8922 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_8923 = torch.constant.int 0 %6848 = torch.aten.index_select %6846, %int0_8923, %6847 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_8924 = torch.constant.int 16 %6849 = torch.aten.remainder.Scalar %6844, %int16_8924 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_8925 = torch.constant.none %6850 = torch.aten.clone %610, %none_8925 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_8926 = torch.constant.none %6851 = torch.aten.clone %611, %none_8926 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_8927 = torch.constant.int 0 %6852 = torch.aten.unsqueeze %6849, %int0_8927 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_8928 = torch.constant.int 0 %int1_8929 = torch.constant.int 1 %6853 = torch.aten.select.int %6812, %int0_8928, %int1_8929 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_8930 = torch.constant.int 0 %int0_8931 = torch.constant.int 0 %6854 = torch.aten.select.int %6853, %int0_8930, %int0_8931 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %6855 = torch.prim.ListConstruct %6848, %6850, %6851, %6852 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> 
!torch.list> %false_8932 = torch.constant.bool false %6856 = torch.aten.index_put %6843, %6855, %6854, %false_8932 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_8933 = torch.constant.int 2662400 %6857 = torch.prim.ListConstruct %731, %int2662400_8933 : (!torch.int, !torch.int) -> !torch.list %6858 = torch.aten.view %6856, %6857 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_8934 = torch.constant.int -1 %int26_8935 = torch.constant.int 26 %int2_8936 = torch.constant.int 2 %int16_8937 = torch.constant.int 16 %int32_8938 = torch.constant.int 32 %int100_8939 = torch.constant.int 100 %6859 = torch.prim.ListConstruct %int-1_8934, %int26_8935, %int2_8936, %int16_8937, %int32_8938, %int100_8939 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6860 = torch.aten.view %6858, %6859 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_8940 = torch.constant.none %6861 = torch.aten.clone %612, %none_8940 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_8941 = torch.constant.none %6862 = torch.aten.clone %613, %none_8941 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_8942 = torch.constant.int 0 %6863 = torch.aten.unsqueeze %6849, %int0_8942 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_8943 = torch.constant.int 0 %int1_8944 = torch.constant.int 1 %6864 = torch.aten.select.int %6798, %int0_8943, %int1_8944 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_8945 = torch.constant.int 0 %int0_8946 = torch.constant.int 0 %6865 = torch.aten.select.int %6864, %int0_8945, %int0_8946 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %6866 = torch.prim.ListConstruct %6848, %6861, %6862, %6863 : 
(!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_8947 = torch.constant.bool false %6867 = torch.aten.index_put %6860, %6866, %6865, %false_8947 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_8948 = torch.constant.int 2662400 %6868 = torch.prim.ListConstruct %731, %int2662400_8948 : (!torch.int, !torch.int) -> !torch.list %6869 = torch.aten.view %6867, %6868 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_8949 = torch.constant.int -1 %int26_8950 = torch.constant.int 26 %int2_8951 = torch.constant.int 2 %int16_8952 = torch.constant.int 16 %int32_8953 = torch.constant.int 32 %int100_8954 = torch.constant.int 100 %6870 = torch.prim.ListConstruct %int-1_8949, %int26_8950, %int2_8951, %int16_8952, %int32_8953, %int100_8954 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6871 = torch.aten.view %6869, %6870 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_8955 = torch.constant.int 0 %int2_8956 = torch.constant.int 2 %6872 = torch.aten.select.int %6813, %int0_8955, %int2_8956 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_8957 = torch.constant.int 0 %int2_8958 = torch.constant.int 2 %6873 = torch.aten.select.int %arg3, %int0_8957, %int2_8958 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_8959 = torch.constant.int 0 %int0_8960 = torch.constant.int 0 %int9223372036854775807_8961 = torch.constant.int 9223372036854775807 %int1_8962 = torch.constant.int 1 %6874 = torch.aten.slice.Tensor %6873, %int0_8959, %int0_8960, %int9223372036854775807_8961, %int1_8962 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_8963 = 
torch.constant.int 16 %6875 = torch.aten.floor_divide.Scalar %6872, %int16_8963 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_8964 = torch.constant.int 0 %6876 = torch.aten.index_select %6874, %int0_8964, %6875 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_8965 = torch.constant.int 16 %6877 = torch.aten.remainder.Scalar %6872, %int16_8965 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_8966 = torch.constant.none %6878 = torch.aten.clone %614, %none_8966 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_8967 = torch.constant.none %6879 = torch.aten.clone %615, %none_8967 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_8968 = torch.constant.int 0 %6880 = torch.aten.unsqueeze %6877, %int0_8968 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_8969 = torch.constant.int 0 %int2_8970 = torch.constant.int 2 %6881 = torch.aten.select.int %6812, %int0_8969, %int2_8970 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_8971 = torch.constant.int 0 %int0_8972 = torch.constant.int 0 %6882 = torch.aten.select.int %6881, %int0_8971, %int0_8972 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %6883 = torch.prim.ListConstruct %6876, %6878, %6879, %6880 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_8973 = torch.constant.bool false %6884 = torch.aten.index_put %6871, %6883, %6882, %false_8973 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_8974 = torch.constant.int 2662400 %6885 = torch.prim.ListConstruct %731, %int2662400_8974 : (!torch.int, !torch.int) -> !torch.list %6886 = torch.aten.view %6884, %6885 : 
!torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_8975 = torch.constant.int -1 %int26_8976 = torch.constant.int 26 %int2_8977 = torch.constant.int 2 %int16_8978 = torch.constant.int 16 %int32_8979 = torch.constant.int 32 %int100_8980 = torch.constant.int 100 %6887 = torch.prim.ListConstruct %int-1_8975, %int26_8976, %int2_8977, %int16_8978, %int32_8979, %int100_8980 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6888 = torch.aten.view %6886, %6887 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_8981 = torch.constant.none %6889 = torch.aten.clone %616, %none_8981 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_8982 = torch.constant.none %6890 = torch.aten.clone %617, %none_8982 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_8983 = torch.constant.int 0 %6891 = torch.aten.unsqueeze %6877, %int0_8983 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_8984 = torch.constant.int 0 %int2_8985 = torch.constant.int 2 %6892 = torch.aten.select.int %6798, %int0_8984, %int2_8985 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_8986 = torch.constant.int 0 %int0_8987 = torch.constant.int 0 %6893 = torch.aten.select.int %6892, %int0_8986, %int0_8987 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %6894 = torch.prim.ListConstruct %6876, %6889, %6890, %6891 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_8988 = torch.constant.bool false %6895 = torch.aten.index_put %6888, %6894, %6893, %false_8988 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_8989 = torch.constant.int 2662400 %6896 = 
torch.prim.ListConstruct %731, %int2662400_8989 : (!torch.int, !torch.int) -> !torch.list %6897 = torch.aten.view %6895, %6896 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_8990 = torch.constant.int -1 %int26_8991 = torch.constant.int 26 %int2_8992 = torch.constant.int 2 %int16_8993 = torch.constant.int 16 %int32_8994 = torch.constant.int 32 %int100_8995 = torch.constant.int 100 %6898 = torch.prim.ListConstruct %int-1_8990, %int26_8991, %int2_8992, %int16_8993, %int32_8994, %int100_8995 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6899 = torch.aten.view %6897, %6898 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_8996 = torch.constant.int 0 %int3_8997 = torch.constant.int 3 %6900 = torch.aten.select.int %6813, %int0_8996, %int3_8997 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_8998 = torch.constant.int 0 %int3_8999 = torch.constant.int 3 %6901 = torch.aten.select.int %arg3, %int0_8998, %int3_8999 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_9000 = torch.constant.int 0 %int0_9001 = torch.constant.int 0 %int9223372036854775807_9002 = torch.constant.int 9223372036854775807 %int1_9003 = torch.constant.int 1 %6902 = torch.aten.slice.Tensor %6901, %int0_9000, %int0_9001, %int9223372036854775807_9002, %int1_9003 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_9004 = torch.constant.int 16 %6903 = torch.aten.floor_divide.Scalar %6900, %int16_9004 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_9005 = torch.constant.int 0 %6904 = torch.aten.index_select %6902, %int0_9005, %6903 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_9006 = torch.constant.int 16 %6905 = torch.aten.remainder.Scalar %6900, %int16_9006 : 
!torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_9007 = torch.constant.none %6906 = torch.aten.clone %618, %none_9007 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_9008 = torch.constant.none %6907 = torch.aten.clone %619, %none_9008 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_9009 = torch.constant.int 0 %6908 = torch.aten.unsqueeze %6905, %int0_9009 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_9010 = torch.constant.int 0 %int3_9011 = torch.constant.int 3 %6909 = torch.aten.select.int %6812, %int0_9010, %int3_9011 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_9012 = torch.constant.int 0 %int0_9013 = torch.constant.int 0 %6910 = torch.aten.select.int %6909, %int0_9012, %int0_9013 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %6911 = torch.prim.ListConstruct %6904, %6906, %6907, %6908 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_9014 = torch.constant.bool false %6912 = torch.aten.index_put %6899, %6911, %6910, %false_9014 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_9015 = torch.constant.int 2662400 %6913 = torch.prim.ListConstruct %731, %int2662400_9015 : (!torch.int, !torch.int) -> !torch.list %6914 = torch.aten.view %6912, %6913 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_9016 = torch.constant.int -1 %int26_9017 = torch.constant.int 26 %int2_9018 = torch.constant.int 2 %int16_9019 = torch.constant.int 16 %int32_9020 = torch.constant.int 32 %int100_9021 = torch.constant.int 100 %6915 = torch.prim.ListConstruct %int-1_9016, %int26_9017, %int2_9018, %int16_9019, %int32_9020, %int100_9021 : (!torch.int, !torch.int, !torch.int, 
!torch.int, !torch.int, !torch.int) -> !torch.list %6916 = torch.aten.view %6914, %6915 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_9022 = torch.constant.none %6917 = torch.aten.clone %620, %none_9022 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_9023 = torch.constant.none %6918 = torch.aten.clone %621, %none_9023 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_9024 = torch.constant.int 0 %6919 = torch.aten.unsqueeze %6905, %int0_9024 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_9025 = torch.constant.int 0 %int3_9026 = torch.constant.int 3 %6920 = torch.aten.select.int %6798, %int0_9025, %int3_9026 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_9027 = torch.constant.int 0 %int0_9028 = torch.constant.int 0 %6921 = torch.aten.select.int %6920, %int0_9027, %int0_9028 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %6922 = torch.prim.ListConstruct %6904, %6917, %6918, %6919 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_9029 = torch.constant.bool false %6923 = torch.aten.index_put %6916, %6922, %6921, %false_9029 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_9030 = torch.constant.int 2662400 %6924 = torch.prim.ListConstruct %731, %int2662400_9030 : (!torch.int, !torch.int) -> !torch.list %6925 = torch.aten.view %6923, %6924 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int52_9031 = torch.constant.int 52 %6926 = torch.aten.mul.Scalar %arg3, %int52_9031 : !torch.vtensor<[4,?],si64>, !torch.int -> !torch.vtensor<[4,?],si64> %int46 = torch.constant.int 46 %int1_9032 = torch.constant.int 1 %6927 = torch.aten.add.Scalar 
%6926, %int46, %int1_9032 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_9033 = torch.constant.int 4 %6928 = torch.aten.mul.int %int4_9033, %655 : !torch.int, !torch.int -> !torch.int %6929 = torch.prim.ListConstruct %6928 : (!torch.int) -> !torch.list %6930 = torch.aten.view %6927, %6929 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int-1_9034 = torch.constant.int -1 %int26_9035 = torch.constant.int 26 %int2_9036 = torch.constant.int 2 %int16_9037 = torch.constant.int 16 %int32_9038 = torch.constant.int 32 %int100_9039 = torch.constant.int 100 %6931 = torch.prim.ListConstruct %int-1_9034, %int26_9035, %int2_9036, %int16_9037, %int32_9038, %int100_9039 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6932 = torch.aten.view %6925, %6931 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int26_9040 = torch.constant.int 26 %6933 = torch.aten.mul.int %731, %int26_9040 : !torch.int, !torch.int -> !torch.int %int2_9041 = torch.constant.int 2 %6934 = torch.aten.mul.int %6933, %int2_9041 : !torch.int, !torch.int -> !torch.int %int16_9042 = torch.constant.int 16 %int32_9043 = torch.constant.int 32 %int100_9044 = torch.constant.int 100 %6935 = torch.prim.ListConstruct %6934, %int16_9042, %int32_9043, %int100_9044 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6936 = torch.aten.view %6932, %6935 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,16,32,100],f32> %int0_9045 = torch.constant.int 0 %6937 = torch.aten.index_select %6936, %int0_9045, %6930 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_9046 = torch.constant.int 4 %int16_9047 = torch.constant.int 16 %int32_9048 = torch.constant.int 32 %int100_9049 = torch.constant.int 100 %6938 = torch.prim.ListConstruct %int4_9046, %655, %int16_9047, %int32_9048, 
%int100_9049 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6939 = torch.aten.view %6937, %6938 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_9050 = torch.constant.int 1 %6940 = torch.aten.size.int %6939, %int1_9050 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_9051 = torch.constant.int 16 %6941 = torch.aten.mul.int %6940, %int16_9051 : !torch.int, !torch.int -> !torch.int %int4_9052 = torch.constant.int 4 %int32_9053 = torch.constant.int 32 %int100_9054 = torch.constant.int 100 %6942 = torch.prim.ListConstruct %int4_9052, %6941, %int32_9053, %int100_9054 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6943 = torch.aten.view %6939, %6942 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_9055 = torch.constant.int 0 %int0_9056 = torch.constant.int 0 %int9223372036854775807_9057 = torch.constant.int 9223372036854775807 %int1_9058 = torch.constant.int 1 %6944 = torch.aten.slice.Tensor %6685, %int0_9055, %int0_9056, %int9223372036854775807_9057, %int1_9058 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int16_9059 = torch.constant.int 16 %6945 = torch.aten.mul.int %655, %int16_9059 : !torch.int, !torch.int -> !torch.int %int1_9060 = torch.constant.int 1 %int0_9061 = torch.constant.int 0 %int1_9062 = torch.constant.int 1 %6946 = torch.aten.slice.Tensor %6944, %int1_9060, %int0_9061, %6945, %int1_9062 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_9063 = torch.constant.bool false %6947 = torch.aten.copy %6946, %6943, %false_9063 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_9064 = torch.constant.int 0 %int0_9065 = torch.constant.int 0 %int9223372036854775807_9066 = 
torch.constant.int 9223372036854775807 %int1_9067 = torch.constant.int 1 %6948 = torch.aten.slice.Tensor %6685, %int0_9064, %int0_9065, %int9223372036854775807_9066, %int1_9067 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_9068 = torch.constant.int 1 %int0_9069 = torch.constant.int 0 %int1_9070 = torch.constant.int 1 %6949 = torch.aten.slice_scatter %6948, %6947, %int1_9068, %int0_9069, %6945, %int1_9070 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_9071 = torch.constant.int 0 %int0_9072 = torch.constant.int 0 %int9223372036854775807_9073 = torch.constant.int 9223372036854775807 %int1_9074 = torch.constant.int 1 %6950 = torch.aten.slice_scatter %6685, %6949, %int0_9071, %int0_9072, %int9223372036854775807_9073, %int1_9074 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_9075 = torch.constant.int 1 %int1_9076 = torch.constant.int 1 %6951 = torch.aten.add.Scalar %6927, %int1_9075, %int1_9076 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_9077 = torch.constant.int 4 %6952 = torch.aten.mul.int %int4_9077, %655 : !torch.int, !torch.int -> !torch.int %6953 = torch.prim.ListConstruct %6952 : (!torch.int) -> !torch.list %6954 = torch.aten.view %6951, %6953 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int0_9078 = torch.constant.int 0 %6955 = torch.aten.index_select %6936, %int0_9078, %6954 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_9079 = torch.constant.int 4 %int16_9080 = torch.constant.int 16 %int32_9081 = torch.constant.int 32 %int100_9082 = torch.constant.int 100 %6956 = torch.prim.ListConstruct %int4_9079, %655, 
%int16_9080, %int32_9081, %int100_9082 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6957 = torch.aten.view %6955, %6956 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_9083 = torch.constant.int 1 %6958 = torch.aten.size.int %6957, %int1_9083 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_9084 = torch.constant.int 16 %6959 = torch.aten.mul.int %6958, %int16_9084 : !torch.int, !torch.int -> !torch.int %int4_9085 = torch.constant.int 4 %int32_9086 = torch.constant.int 32 %int100_9087 = torch.constant.int 100 %6960 = torch.prim.ListConstruct %int4_9085, %6959, %int32_9086, %int100_9087 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6961 = torch.aten.view %6957, %6960 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_9088 = torch.constant.int 0 %int0_9089 = torch.constant.int 0 %int9223372036854775807_9090 = torch.constant.int 9223372036854775807 %int1_9091 = torch.constant.int 1 %6962 = torch.aten.slice.Tensor %6702, %int0_9088, %int0_9089, %int9223372036854775807_9090, %int1_9091 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_9092 = torch.constant.int 1 %int0_9093 = torch.constant.int 0 %int1_9094 = torch.constant.int 1 %6963 = torch.aten.slice.Tensor %6962, %int1_9092, %int0_9093, %6945, %int1_9094 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_9095 = torch.constant.bool false %6964 = torch.aten.copy %6963, %6961, %false_9095 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_9096 = torch.constant.int 0 %int0_9097 = torch.constant.int 0 %int9223372036854775807_9098 = torch.constant.int 9223372036854775807 %int1_9099 = torch.constant.int 1 %6965 = 
torch.aten.slice.Tensor %6702, %int0_9096, %int0_9097, %int9223372036854775807_9098, %int1_9099 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_9100 = torch.constant.int 1 %int0_9101 = torch.constant.int 0 %int1_9102 = torch.constant.int 1 %6966 = torch.aten.slice_scatter %6965, %6964, %int1_9100, %int0_9101, %6945, %int1_9102 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_9103 = torch.constant.int 0 %int0_9104 = torch.constant.int 0 %int9223372036854775807_9105 = torch.constant.int 9223372036854775807 %int1_9106 = torch.constant.int 1 %6967 = torch.aten.slice_scatter %6702, %6966, %int0_9103, %int0_9104, %int9223372036854775807_9105, %int1_9106 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_9107 = torch.constant.int 0 %int0_9108 = torch.constant.int 0 %int9223372036854775807_9109 = torch.constant.int 9223372036854775807 %int1_9110 = torch.constant.int 1 %6968 = torch.aten.slice.Tensor %671, %int0_9107, %int0_9108, %int9223372036854775807_9109, %int1_9110 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_9111 = torch.constant.int 1 %int0_9112 = torch.constant.int 0 %int1_9113 = torch.constant.int 1 %6969 = torch.aten.slice.Tensor %6968, %int1_9111, %int0_9112, %6945, %int1_9113 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int0_9114 = torch.constant.int 0 %int0_9115 = torch.constant.int 0 %int9223372036854775807_9116 = torch.constant.int 9223372036854775807 %int1_9117 = torch.constant.int 1 %6970 = torch.aten.slice.Tensor %673, %int0_9114, %int0_9115, %int9223372036854775807_9116, %int1_9117 : 
!torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_9118 = torch.constant.int 1 %int0_9119 = torch.constant.int 0 %int1_9120 = torch.constant.int 1 %6971 = torch.aten.slice.Tensor %6970, %int1_9118, %int0_9119, %6945, %int1_9120 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_9121 = torch.constant.int 1 %int2_9122 = torch.constant.int 2 %6972 = torch.aten.transpose.int %6808, %int1_9121, %int2_9122 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,1,100],f32> %int4_9123 = torch.constant.int 4 %int32_9124 = torch.constant.int 32 %int1_9125 = torch.constant.int 1 %int100_9126 = torch.constant.int 100 %6973 = torch.prim.ListConstruct %int4_9123, %int32_9124, %int1_9125, %int100_9126 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_9127 = torch.constant.bool false %6974 = torch.aten.expand %6972, %6973, %false_9127 : !torch.vtensor<[4,32,1,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,100],f32> %int128_9128 = torch.constant.int 128 %int1_9129 = torch.constant.int 1 %int100_9130 = torch.constant.int 100 %6975 = torch.prim.ListConstruct %int128_9128, %int1_9129, %int100_9130 : (!torch.int, !torch.int, !torch.int) -> !torch.list %6976 = torch.aten.view %6974, %6975 : !torch.vtensor<[4,32,1,100],f32>, !torch.list -> !torch.vtensor<[128,1,100],f32> %int0_9131 = torch.constant.int 0 %int0_9132 = torch.constant.int 0 %int9223372036854775807_9133 = torch.constant.int 9223372036854775807 %int1_9134 = torch.constant.int 1 %6977 = torch.aten.slice.Tensor %6950, %int0_9131, %int0_9132, %int9223372036854775807_9133, %int1_9134 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_9135 = torch.constant.int 1 %int0_9136 = torch.constant.int 0 %int1_9137 = torch.constant.int 1 %6978 
= torch.aten.slice.Tensor %6977, %int1_9135, %int0_9136, %6945, %int1_9137 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_9138 = torch.constant.int 1 %int2_9139 = torch.constant.int 2 %6979 = torch.aten.transpose.int %6978, %int1_9138, %int2_9139 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int2_9140 = torch.constant.int 2 %int3_9141 = torch.constant.int 3 %6980 = torch.aten.transpose.int %6979, %int2_9140, %int3_9141 : !torch.vtensor<[4,32,?,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int1_9142 = torch.constant.int 1 %6981 = torch.aten.size.int %6969, %int1_9142 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_9143 = torch.constant.int 4 %int32_9144 = torch.constant.int 32 %int100_9145 = torch.constant.int 100 %6982 = torch.prim.ListConstruct %int4_9143, %int32_9144, %int100_9145, %6981 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_9146 = torch.constant.bool false %6983 = torch.aten.expand %6980, %6982, %false_9146 : !torch.vtensor<[4,32,100,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,100,?],f32> %int0_9147 = torch.constant.int 0 %6984 = torch.aten.clone %6983, %int0_9147 : !torch.vtensor<[4,32,100,?],f32>, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int128_9148 = torch.constant.int 128 %int100_9149 = torch.constant.int 100 %6985 = torch.prim.ListConstruct %int128_9148, %int100_9149, %6981 : (!torch.int, !torch.int, !torch.int) -> !torch.list %6986 = torch.aten._unsafe_view %6984, %6985 : !torch.vtensor<[4,32,100,?],f32>, !torch.list -> !torch.vtensor<[128,100,?],f32> %6987 = torch.aten.bmm %6976, %6986 : !torch.vtensor<[128,1,100],f32>, !torch.vtensor<[128,100,?],f32> -> !torch.vtensor<[128,1,?],f32> %int4_9150 = torch.constant.int 4 %int32_9151 = torch.constant.int 32 %int1_9152 = torch.constant.int 1 %6988 = torch.prim.ListConstruct 
%int4_9150, %int32_9151, %int1_9152, %6981 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %6989 = torch.aten.view %6987, %6988 : !torch.vtensor<[128,1,?],f32>, !torch.list -> !torch.vtensor<[4,32,1,?],f32> %float1.000000e01_9153 = torch.constant.float 1.000000e+01 %6990 = torch.aten.div.Scalar %6989, %float1.000000e01_9153 : !torch.vtensor<[4,32,1,?],f32>, !torch.float -> !torch.vtensor<[4,32,1,?],f32> %int1_9154 = torch.constant.int 1 %6991 = torch.aten.add.Tensor %6990, %895, %int1_9154 : !torch.vtensor<[4,32,1,?],f32>, !torch.vtensor<[4,1,1,?],f32>, !torch.int -> !torch.vtensor<[4,32,1,?],f32> %int-1_9155 = torch.constant.int -1 %false_9156 = torch.constant.bool false %6992 = torch.aten._softmax %6991, %int-1_9155, %false_9156 : !torch.vtensor<[4,32,1,?],f32>, !torch.int, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int4_9157 = torch.constant.int 4 %int32_9158 = torch.constant.int 32 %int1_9159 = torch.constant.int 1 %6993 = torch.prim.ListConstruct %int4_9157, %int32_9158, %int1_9159, %6981 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_9160 = torch.constant.bool false %6994 = torch.aten.expand %6992, %6993, %false_9160 : !torch.vtensor<[4,32,1,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int128_9161 = torch.constant.int 128 %int1_9162 = torch.constant.int 1 %6995 = torch.prim.ListConstruct %int128_9161, %int1_9162, %6981 : (!torch.int, !torch.int, !torch.int) -> !torch.list %6996 = torch.aten.view %6994, %6995 : !torch.vtensor<[4,32,1,?],f32>, !torch.list -> !torch.vtensor<[128,1,?],f32> %int0_9163 = torch.constant.int 0 %int0_9164 = torch.constant.int 0 %int9223372036854775807_9165 = torch.constant.int 9223372036854775807 %int1_9166 = torch.constant.int 1 %6997 = torch.aten.slice.Tensor %6967, %int0_9163, %int0_9164, %int9223372036854775807_9165, %int1_9166 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> 
%int1_9167 = torch.constant.int 1 %int0_9168 = torch.constant.int 0 %int1_9169 = torch.constant.int 1 %6998 = torch.aten.slice.Tensor %6997, %int1_9167, %int0_9168, %6945, %int1_9169 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_9170 = torch.constant.int 1 %int2_9171 = torch.constant.int 2 %6999 = torch.aten.transpose.int %6998, %int1_9170, %int2_9171 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int1_9172 = torch.constant.int 1 %7000 = torch.aten.size.int %6971, %int1_9172 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_9173 = torch.constant.int 4 %int32_9174 = torch.constant.int 32 %int100_9175 = torch.constant.int 100 %7001 = torch.prim.ListConstruct %int4_9173, %int32_9174, %7000, %int100_9175 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_9176 = torch.constant.bool false %7002 = torch.aten.expand %6999, %7001, %false_9176 : !torch.vtensor<[4,32,?,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,?,100],f32> %int0_9177 = torch.constant.int 0 %7003 = torch.aten.clone %7002, %int0_9177 : !torch.vtensor<[4,32,?,100],f32>, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int128_9178 = torch.constant.int 128 %int100_9179 = torch.constant.int 100 %7004 = torch.prim.ListConstruct %int128_9178, %7000, %int100_9179 : (!torch.int, !torch.int, !torch.int) -> !torch.list %7005 = torch.aten._unsafe_view %7003, %7004 : !torch.vtensor<[4,32,?,100],f32>, !torch.list -> !torch.vtensor<[128,?,100],f32> %7006 = torch.aten.bmm %6996, %7005 : !torch.vtensor<[128,1,?],f32>, !torch.vtensor<[128,?,100],f32> -> !torch.vtensor<[128,1,100],f32> %int4_9180 = torch.constant.int 4 %int32_9181 = torch.constant.int 32 %int1_9182 = torch.constant.int 1 %int100_9183 = torch.constant.int 100 %7007 = torch.prim.ListConstruct %int4_9180, %int32_9181, %int1_9182, %int100_9183 : (!torch.int, !torch.int, !torch.int, 
!torch.int) -> !torch.list %7008 = torch.aten.view %7006, %7007 : !torch.vtensor<[128,1,100],f32>, !torch.list -> !torch.vtensor<[4,32,1,100],f32> %int1_9184 = torch.constant.int 1 %int2_9185 = torch.constant.int 2 %7009 = torch.aten.transpose.int %7008, %int1_9184, %int2_9185 : !torch.vtensor<[4,32,1,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,1,32,100],f32> %int4_9186 = torch.constant.int 4 %int1_9187 = torch.constant.int 1 %int-1_9188 = torch.constant.int -1 %7010 = torch.prim.ListConstruct %int4_9186, %int1_9187, %int-1_9188 : (!torch.int, !torch.int, !torch.int) -> !torch.list %7011 = torch.aten.view %7009, %7010 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,3200],f32> %7012 = torch_c.to_builtin_tensor %7011 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_9189 = tensor.cast %7012 : tensor<4x1x3200xf32> to tensor %7013 = torch_c.to_builtin_tensor %213 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %7014 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_9189, %7013) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_9190 = tensor.cast %7014 : tensor to tensor<4x1x3200xf32> %7015 = torch_c.from_builtin_tensor %cast_9190 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int1_9191 = torch.constant.int 1 %7016 = torch.aten.add.Tensor %6773, %7015, %int1_9191 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_9192 = torch.constant.int 2 %7017 = torch.aten.pow.Tensor_Scalar %7016, %int2_9192 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_9193 = torch.constant.int -1 %7018 = torch.prim.ListConstruct %int-1_9193 : (!torch.int) -> !torch.list %true_9194 = torch.constant.bool true %none_9195 = torch.constant.none %7019 = torch.aten.mean.dim %7017, %7018, %true_9194, %none_9195 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> 
%float9.999990e-07_9196 = torch.constant.float 9.9999999747524271E-7 %int1_9197 = torch.constant.int 1 %7020 = torch.aten.add.Scalar %7019, %float9.999990e-07_9196, %int1_9197 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %7021 = torch.aten.rsqrt %7020 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %7022 = torch.aten.mul.Tensor %7016, %7021 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %7023 = torch.aten.mul.Tensor %7022, %214 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %7024 = torch_c.to_builtin_tensor %7023 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_9198 = tensor.cast %7024 : tensor<4x1x3200xf32> to tensor %7025 = torch_c.to_builtin_tensor %215 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %7026 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_9198, %7025) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_9199 = tensor.cast %7026 : tensor to tensor<4x1x8640xf32> %7027 = torch_c.from_builtin_tensor %cast_9199 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %7028 = torch.aten.silu %7027 : !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32> %7029 = torch_c.to_builtin_tensor %7023 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_9200 = tensor.cast %7029 : tensor<4x1x3200xf32> to tensor %7030 = torch_c.to_builtin_tensor %216 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %7031 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_9200, %7030) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_9201 = tensor.cast %7031 : tensor to tensor<4x1x8640xf32> %7032 = torch_c.from_builtin_tensor %cast_9201 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %7033 = torch.aten.mul.Tensor %7028, %7032 : !torch.vtensor<[4,1,8640],f32>, !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32> %7034 = torch_c.to_builtin_tensor 
%7033 : !torch.vtensor<[4,1,8640],f32> -> tensor<4x1x8640xf32> %cast_9202 = tensor.cast %7034 : tensor<4x1x8640xf32> to tensor %7035 = torch_c.to_builtin_tensor %217 : !torch.vtensor<[3200,8640],f16> -> tensor<3200x8640xf16> %7036 = util.call @sharktank_mmtfp_3d_3200_8640_f32f16f32(%cast_9202, %7035) : (tensor, tensor<3200x8640xf16>) -> tensor %cast_9203 = tensor.cast %7036 : tensor to tensor<4x1x3200xf32> %7037 = torch_c.from_builtin_tensor %cast_9203 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int1_9204 = torch.constant.int 1 %7038 = torch.aten.add.Tensor %7016, %7037, %int1_9204 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_9205 = torch.constant.int 2 %7039 = torch.aten.pow.Tensor_Scalar %7038, %int2_9205 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_9206 = torch.constant.int -1 %7040 = torch.prim.ListConstruct %int-1_9206 : (!torch.int) -> !torch.list %true_9207 = torch.constant.bool true %none_9208 = torch.constant.none %7041 = torch.aten.mean.dim %7039, %7040, %true_9207, %none_9208 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_9209 = torch.constant.float 9.9999999747524271E-7 %int1_9210 = torch.constant.int 1 %7042 = torch.aten.add.Scalar %7041, %float9.999990e-07_9209, %int1_9210 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %7043 = torch.aten.rsqrt %7042 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %7044 = torch.aten.mul.Tensor %7038, %7043 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %7045 = torch.aten.mul.Tensor %7044, %218 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %7046 = torch_c.to_builtin_tensor %7045 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_9211 = tensor.cast %7046 : 
tensor<4x1x3200xf32> to tensor %7047 = torch_c.to_builtin_tensor %219 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %7048 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_9211, %7047) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_9212 = tensor.cast %7048 : tensor to tensor<4x1x3200xf32> %7049 = torch_c.from_builtin_tensor %cast_9212 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %7050 = torch_c.to_builtin_tensor %7045 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_9213 = tensor.cast %7050 : tensor<4x1x3200xf32> to tensor %7051 = torch_c.to_builtin_tensor %220 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %7052 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_9213, %7051) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_9214 = tensor.cast %7052 : tensor to tensor<4x1x3200xf32> %7053 = torch_c.from_builtin_tensor %cast_9214 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %7054 = torch_c.to_builtin_tensor %7045 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_9215 = tensor.cast %7054 : tensor<4x1x3200xf32> to tensor %7055 = torch_c.to_builtin_tensor %221 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %7056 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_9215, %7055) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_9216 = tensor.cast %7056 : tensor to tensor<4x1x3200xf32> %7057 = torch_c.from_builtin_tensor %cast_9216 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int4_9217 = torch.constant.int 4 %int1_9218 = torch.constant.int 1 %int32_9219 = torch.constant.int 32 %int100_9220 = torch.constant.int 100 %7058 = torch.prim.ListConstruct %int4_9217, %int1_9218, %int32_9219, %int100_9220 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %7059 = torch.aten.view %7049, %7058 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_9221 = torch.constant.int 4 %int1_9222 = torch.constant.int 1 
%int32_9223 = torch.constant.int 32 %int100_9224 = torch.constant.int 100 %7060 = torch.prim.ListConstruct %int4_9221, %int1_9222, %int32_9223, %int100_9224 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %7061 = torch.aten.view %7053, %7060 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_9225 = torch.constant.int 4 %int1_9226 = torch.constant.int 1 %int32_9227 = torch.constant.int 32 %int100_9228 = torch.constant.int 100 %7062 = torch.prim.ListConstruct %int4_9225, %int1_9226, %int32_9227, %int100_9228 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %7063 = torch.aten.view %7057, %7062 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_9229 = torch.constant.int 4 %int1_9230 = torch.constant.int 1 %int32_9231 = torch.constant.int 32 %int-1_9232 = torch.constant.int -1 %int2_9233 = torch.constant.int 2 %7064 = torch.prim.ListConstruct %int4_9229, %int1_9230, %int32_9231, %int-1_9232, %int2_9233 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %7065 = torch.aten.view %7059, %7064 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %7066 = torch.aten.view_as_complex %7065 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %int4_9234 = torch.constant.int 4 %int1_9235 = torch.constant.int 1 %int32_9236 = torch.constant.int 32 %int-1_9237 = torch.constant.int -1 %int2_9238 = torch.constant.int 2 %7067 = torch.prim.ListConstruct %int4_9234, %int1_9235, %int32_9236, %int-1_9237, %int2_9238 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %7068 = torch.aten.view %7061, %7067 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %7069 = torch.aten.view_as_complex %7068 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %7070 = torch.aten.mul.Tensor %7066, %669 : 
!torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %7071 = torch.aten.view_as_real %7070 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_9239 = torch.constant.int 4 %int1_9240 = torch.constant.int 1 %int32_9241 = torch.constant.int 32 %int100_9242 = torch.constant.int 100 %7072 = torch.prim.ListConstruct %int4_9239, %int1_9240, %int32_9241, %int100_9242 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %7073 = torch.aten.view %7071, %7072 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %7074 = torch.aten.mul.Tensor %7069, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %7075 = torch.aten.view_as_real %7074 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_9243 = torch.constant.int 4 %int1_9244 = torch.constant.int 1 %int32_9245 = torch.constant.int 32 %int100_9246 = torch.constant.int 100 %7076 = torch.prim.ListConstruct %int4_9243, %int1_9244, %int32_9245, %int100_9246 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %7077 = torch.aten.view %7075, %7076 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int1_9247 = torch.constant.int 1 %int1_9248 = torch.constant.int 1 %7078 = torch.aten.add.Scalar %arg2, %int1_9247, %int1_9248 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[4],si64> %int0_9249 = torch.constant.int 0 %int0_9250 = torch.constant.int 0 %7079 = torch.aten.select.int %7078, %int0_9249, %int0_9250 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_9251 = torch.constant.int 0 %int0_9252 = torch.constant.int 0 %7080 = torch.aten.select.int %arg3, %int0_9251, %int0_9252 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_9253 = torch.constant.int 0 %int0_9254 = 
torch.constant.int 0 %int9223372036854775807_9255 = torch.constant.int 9223372036854775807 %int1_9256 = torch.constant.int 1 %7081 = torch.aten.slice.Tensor %7080, %int0_9253, %int0_9254, %int9223372036854775807_9255, %int1_9256 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_9257 = torch.constant.int 16 %7082 = torch.aten.floor_divide.Scalar %7079, %int16_9257 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_9258 = torch.constant.int 0 %7083 = torch.aten.index_select %7081, %int0_9258, %7082 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_9259 = torch.constant.int 16 %7084 = torch.aten.remainder.Scalar %7079, %int16_9259 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_9260 = torch.constant.none %7085 = torch.aten.clone %622, %none_9260 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_9261 = torch.constant.none %7086 = torch.aten.clone %623, %none_9261 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_9262 = torch.constant.int 0 %7087 = torch.aten.unsqueeze %7084, %int0_9262 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_9263 = torch.constant.int 0 %int0_9264 = torch.constant.int 0 %7088 = torch.aten.select.int %7077, %int0_9263, %int0_9264 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_9265 = torch.constant.int 0 %int0_9266 = torch.constant.int 0 %7089 = torch.aten.select.int %7088, %int0_9265, %int0_9266 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %int-1_9267 = torch.constant.int -1 %int26_9268 = torch.constant.int 26 %int2_9269 = torch.constant.int 2 %int16_9270 = torch.constant.int 16 %int32_9271 = torch.constant.int 32 %int100_9272 = torch.constant.int 100 %7090 = torch.prim.ListConstruct %int-1_9267, %int26_9268, %int2_9269, 
%int16_9270, %int32_9271, %int100_9272 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %7091 = torch.aten.view %6925, %7090 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %7092 = torch.prim.ListConstruct %7083, %7085, %7086, %7087 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_9273 = torch.constant.bool false %7093 = torch.aten.index_put %7091, %7092, %7089, %false_9273 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_9274 = torch.constant.int 2662400 %7094 = torch.prim.ListConstruct %731, %int2662400_9274 : (!torch.int, !torch.int) -> !torch.list %7095 = torch.aten.view %7093, %7094 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_9275 = torch.constant.int -1 %int26_9276 = torch.constant.int 26 %int2_9277 = torch.constant.int 2 %int16_9278 = torch.constant.int 16 %int32_9279 = torch.constant.int 32 %int100_9280 = torch.constant.int 100 %7096 = torch.prim.ListConstruct %int-1_9275, %int26_9276, %int2_9277, %int16_9278, %int32_9279, %int100_9280 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %7097 = torch.aten.view %7095, %7096 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_9281 = torch.constant.none %7098 = torch.aten.clone %624, %none_9281 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_9282 = torch.constant.none %7099 = torch.aten.clone %625, %none_9282 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_9283 = torch.constant.int 0 %7100 = torch.aten.unsqueeze %7084, %int0_9283 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_9284 = torch.constant.int 0 %int0_9285 = torch.constant.int 0 %7101 
= torch.aten.select.int %7063, %int0_9284, %int0_9285 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_9286 = torch.constant.int 0 %int0_9287 = torch.constant.int 0 %7102 = torch.aten.select.int %7101, %int0_9286, %int0_9287 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %7103 = torch.prim.ListConstruct %7083, %7098, %7099, %7100 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_9288 = torch.constant.bool false %7104 = torch.aten.index_put %7097, %7103, %7102, %false_9288 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_9289 = torch.constant.int 2662400 %7105 = torch.prim.ListConstruct %731, %int2662400_9289 : (!torch.int, !torch.int) -> !torch.list %7106 = torch.aten.view %7104, %7105 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_9290 = torch.constant.int -1 %int26_9291 = torch.constant.int 26 %int2_9292 = torch.constant.int 2 %int16_9293 = torch.constant.int 16 %int32_9294 = torch.constant.int 32 %int100_9295 = torch.constant.int 100 %7107 = torch.prim.ListConstruct %int-1_9290, %int26_9291, %int2_9292, %int16_9293, %int32_9294, %int100_9295 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %7108 = torch.aten.view %7106, %7107 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_9296 = torch.constant.int 0 %int1_9297 = torch.constant.int 1 %7109 = torch.aten.select.int %7078, %int0_9296, %int1_9297 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_9298 = torch.constant.int 0 %int1_9299 = torch.constant.int 1 %7110 = torch.aten.select.int %arg3, %int0_9298, %int1_9299 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> 
!torch.vtensor<[?],si64> %int0_9300 = torch.constant.int 0 %int0_9301 = torch.constant.int 0 %int9223372036854775807_9302 = torch.constant.int 9223372036854775807 %int1_9303 = torch.constant.int 1 %7111 = torch.aten.slice.Tensor %7110, %int0_9300, %int0_9301, %int9223372036854775807_9302, %int1_9303 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_9304 = torch.constant.int 16 %7112 = torch.aten.floor_divide.Scalar %7109, %int16_9304 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_9305 = torch.constant.int 0 %7113 = torch.aten.index_select %7111, %int0_9305, %7112 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_9306 = torch.constant.int 16 %7114 = torch.aten.remainder.Scalar %7109, %int16_9306 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_9307 = torch.constant.none %7115 = torch.aten.clone %626, %none_9307 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_9308 = torch.constant.none %7116 = torch.aten.clone %627, %none_9308 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_9309 = torch.constant.int 0 %7117 = torch.aten.unsqueeze %7114, %int0_9309 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_9310 = torch.constant.int 0 %int1_9311 = torch.constant.int 1 %7118 = torch.aten.select.int %7077, %int0_9310, %int1_9311 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_9312 = torch.constant.int 0 %int0_9313 = torch.constant.int 0 %7119 = torch.aten.select.int %7118, %int0_9312, %int0_9313 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %7120 = torch.prim.ListConstruct %7113, %7115, %7116, %7117 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_9314 = torch.constant.bool false 
%7121 = torch.aten.index_put %7108, %7120, %7119, %false_9314 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_9315 = torch.constant.int 2662400 %7122 = torch.prim.ListConstruct %731, %int2662400_9315 : (!torch.int, !torch.int) -> !torch.list %7123 = torch.aten.view %7121, %7122 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_9316 = torch.constant.int -1 %int26_9317 = torch.constant.int 26 %int2_9318 = torch.constant.int 2 %int16_9319 = torch.constant.int 16 %int32_9320 = torch.constant.int 32 %int100_9321 = torch.constant.int 100 %7124 = torch.prim.ListConstruct %int-1_9316, %int26_9317, %int2_9318, %int16_9319, %int32_9320, %int100_9321 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %7125 = torch.aten.view %7123, %7124 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_9322 = torch.constant.none %7126 = torch.aten.clone %628, %none_9322 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_9323 = torch.constant.none %7127 = torch.aten.clone %629, %none_9323 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_9324 = torch.constant.int 0 %7128 = torch.aten.unsqueeze %7114, %int0_9324 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_9325 = torch.constant.int 0 %int1_9326 = torch.constant.int 1 %7129 = torch.aten.select.int %7063, %int0_9325, %int1_9326 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_9327 = torch.constant.int 0 %int0_9328 = torch.constant.int 0 %7130 = torch.aten.select.int %7129, %int0_9327, %int0_9328 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %7131 = torch.prim.ListConstruct %7113, %7126, %7127, %7128 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, 
!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_9329 = torch.constant.bool false %7132 = torch.aten.index_put %7125, %7131, %7130, %false_9329 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_9330 = torch.constant.int 2662400 %7133 = torch.prim.ListConstruct %731, %int2662400_9330 : (!torch.int, !torch.int) -> !torch.list %7134 = torch.aten.view %7132, %7133 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_9331 = torch.constant.int -1 %int26_9332 = torch.constant.int 26 %int2_9333 = torch.constant.int 2 %int16_9334 = torch.constant.int 16 %int32_9335 = torch.constant.int 32 %int100_9336 = torch.constant.int 100 %7135 = torch.prim.ListConstruct %int-1_9331, %int26_9332, %int2_9333, %int16_9334, %int32_9335, %int100_9336 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %7136 = torch.aten.view %7134, %7135 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_9337 = torch.constant.int 0 %int2_9338 = torch.constant.int 2 %7137 = torch.aten.select.int %7078, %int0_9337, %int2_9338 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_9339 = torch.constant.int 0 %int2_9340 = torch.constant.int 2 %7138 = torch.aten.select.int %arg3, %int0_9339, %int2_9340 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_9341 = torch.constant.int 0 %int0_9342 = torch.constant.int 0 %int9223372036854775807_9343 = torch.constant.int 9223372036854775807 %int1_9344 = torch.constant.int 1 %7139 = torch.aten.slice.Tensor %7138, %int0_9341, %int0_9342, %int9223372036854775807_9343, %int1_9344 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_9345 = torch.constant.int 16 %7140 = torch.aten.floor_divide.Scalar %7137, 
%int16_9345 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_9346 = torch.constant.int 0 %7141 = torch.aten.index_select %7139, %int0_9346, %7140 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_9347 = torch.constant.int 16 %7142 = torch.aten.remainder.Scalar %7137, %int16_9347 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_9348 = torch.constant.none %7143 = torch.aten.clone %630, %none_9348 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_9349 = torch.constant.none %7144 = torch.aten.clone %631, %none_9349 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_9350 = torch.constant.int 0 %7145 = torch.aten.unsqueeze %7142, %int0_9350 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_9351 = torch.constant.int 0 %int2_9352 = torch.constant.int 2 %7146 = torch.aten.select.int %7077, %int0_9351, %int2_9352 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_9353 = torch.constant.int 0 %int0_9354 = torch.constant.int 0 %7147 = torch.aten.select.int %7146, %int0_9353, %int0_9354 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %7148 = torch.prim.ListConstruct %7141, %7143, %7144, %7145 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_9355 = torch.constant.bool false %7149 = torch.aten.index_put %7136, %7148, %7147, %false_9355 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_9356 = torch.constant.int 2662400 %7150 = torch.prim.ListConstruct %731, %int2662400_9356 : (!torch.int, !torch.int) -> !torch.list %7151 = torch.aten.view %7149, %7150 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_9357 = 
torch.constant.int -1 %int26_9358 = torch.constant.int 26 %int2_9359 = torch.constant.int 2 %int16_9360 = torch.constant.int 16 %int32_9361 = torch.constant.int 32 %int100_9362 = torch.constant.int 100 %7152 = torch.prim.ListConstruct %int-1_9357, %int26_9358, %int2_9359, %int16_9360, %int32_9361, %int100_9362 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %7153 = torch.aten.view %7151, %7152 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_9363 = torch.constant.none %7154 = torch.aten.clone %632, %none_9363 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_9364 = torch.constant.none %7155 = torch.aten.clone %633, %none_9364 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_9365 = torch.constant.int 0 %7156 = torch.aten.unsqueeze %7142, %int0_9365 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_9366 = torch.constant.int 0 %int2_9367 = torch.constant.int 2 %7157 = torch.aten.select.int %7063, %int0_9366, %int2_9367 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_9368 = torch.constant.int 0 %int0_9369 = torch.constant.int 0 %7158 = torch.aten.select.int %7157, %int0_9368, %int0_9369 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %7159 = torch.prim.ListConstruct %7141, %7154, %7155, %7156 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_9370 = torch.constant.bool false %7160 = torch.aten.index_put %7153, %7159, %7158, %false_9370 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_9371 = torch.constant.int 2662400 %7161 = torch.prim.ListConstruct %731, %int2662400_9371 : (!torch.int, !torch.int) -> !torch.list %7162 = torch.aten.view %7160, 
%7161 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_9372 = torch.constant.int -1 %int26_9373 = torch.constant.int 26 %int2_9374 = torch.constant.int 2 %int16_9375 = torch.constant.int 16 %int32_9376 = torch.constant.int 32 %int100_9377 = torch.constant.int 100 %7163 = torch.prim.ListConstruct %int-1_9372, %int26_9373, %int2_9374, %int16_9375, %int32_9376, %int100_9377 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %7164 = torch.aten.view %7162, %7163 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_9378 = torch.constant.int 0 %int3_9379 = torch.constant.int 3 %7165 = torch.aten.select.int %7078, %int0_9378, %int3_9379 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_9380 = torch.constant.int 0 %int3_9381 = torch.constant.int 3 %7166 = torch.aten.select.int %arg3, %int0_9380, %int3_9381 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_9382 = torch.constant.int 0 %int0_9383 = torch.constant.int 0 %int9223372036854775807_9384 = torch.constant.int 9223372036854775807 %int1_9385 = torch.constant.int 1 %7167 = torch.aten.slice.Tensor %7166, %int0_9382, %int0_9383, %int9223372036854775807_9384, %int1_9385 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_9386 = torch.constant.int 16 %7168 = torch.aten.floor_divide.Scalar %7165, %int16_9386 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_9387 = torch.constant.int 0 %7169 = torch.aten.index_select %7167, %int0_9387, %7168 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_9388 = torch.constant.int 16 %7170 = torch.aten.remainder.Scalar %7165, %int16_9388 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_9389 = torch.constant.none %7171 = torch.aten.clone %634, 
%none_9389 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_9390 = torch.constant.none %7172 = torch.aten.clone %635, %none_9390 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_9391 = torch.constant.int 0 %7173 = torch.aten.unsqueeze %7170, %int0_9391 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_9392 = torch.constant.int 0 %int3_9393 = torch.constant.int 3 %7174 = torch.aten.select.int %7077, %int0_9392, %int3_9393 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_9394 = torch.constant.int 0 %int0_9395 = torch.constant.int 0 %7175 = torch.aten.select.int %7174, %int0_9394, %int0_9395 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %7176 = torch.prim.ListConstruct %7169, %7171, %7172, %7173 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_9396 = torch.constant.bool false %7177 = torch.aten.index_put %7164, %7176, %7175, %false_9396 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_9397 = torch.constant.int 2662400 %7178 = torch.prim.ListConstruct %731, %int2662400_9397 : (!torch.int, !torch.int) -> !torch.list %7179 = torch.aten.view %7177, %7178 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_9398 = torch.constant.int -1 %int26_9399 = torch.constant.int 26 %int2_9400 = torch.constant.int 2 %int16_9401 = torch.constant.int 16 %int32_9402 = torch.constant.int 32 %int100_9403 = torch.constant.int 100 %7180 = torch.prim.ListConstruct %int-1_9398, %int26_9399, %int2_9400, %int16_9401, %int32_9402, %int100_9403 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %7181 = torch.aten.view %7179, %7180 : !torch.vtensor<[?,2662400],f32>, 
!torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_9404 = torch.constant.none %7182 = torch.aten.clone %636, %none_9404 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_9405 = torch.constant.none %7183 = torch.aten.clone %637, %none_9405 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_9406 = torch.constant.int 0 %7184 = torch.aten.unsqueeze %7170, %int0_9406 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_9407 = torch.constant.int 0 %int3_9408 = torch.constant.int 3 %7185 = torch.aten.select.int %7063, %int0_9407, %int3_9408 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_9409 = torch.constant.int 0 %int0_9410 = torch.constant.int 0 %7186 = torch.aten.select.int %7185, %int0_9409, %int0_9410 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %7187 = torch.prim.ListConstruct %7169, %7182, %7183, %7184 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_9411 = torch.constant.bool false %7188 = torch.aten.index_put %7181, %7187, %7186, %false_9411 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_9412 = torch.constant.int 2662400 %7189 = torch.prim.ListConstruct %731, %int2662400_9412 : (!torch.int, !torch.int) -> !torch.list %7190 = torch.aten.view %7188, %7189 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int52_9413 = torch.constant.int 52 %7191 = torch.aten.mul.Scalar %arg3, %int52_9413 : !torch.vtensor<[4,?],si64>, !torch.int -> !torch.vtensor<[4,?],si64> %int48 = torch.constant.int 48 %int1_9414 = torch.constant.int 1 %7192 = torch.aten.add.Scalar %7191, %int48, %int1_9414 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_9415 = 
torch.constant.int 4 %7193 = torch.aten.mul.int %int4_9415, %655 : !torch.int, !torch.int -> !torch.int %7194 = torch.prim.ListConstruct %7193 : (!torch.int) -> !torch.list %7195 = torch.aten.view %7192, %7194 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int-1_9416 = torch.constant.int -1 %int26_9417 = torch.constant.int 26 %int2_9418 = torch.constant.int 2 %int16_9419 = torch.constant.int 16 %int32_9420 = torch.constant.int 32 %int100_9421 = torch.constant.int 100 %7196 = torch.prim.ListConstruct %int-1_9416, %int26_9417, %int2_9418, %int16_9419, %int32_9420, %int100_9421 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %7197 = torch.aten.view %7190, %7196 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int26_9422 = torch.constant.int 26 %7198 = torch.aten.mul.int %731, %int26_9422 : !torch.int, !torch.int -> !torch.int %int2_9423 = torch.constant.int 2 %7199 = torch.aten.mul.int %7198, %int2_9423 : !torch.int, !torch.int -> !torch.int %int16_9424 = torch.constant.int 16 %int32_9425 = torch.constant.int 32 %int100_9426 = torch.constant.int 100 %7200 = torch.prim.ListConstruct %7199, %int16_9424, %int32_9425, %int100_9426 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %7201 = torch.aten.view %7197, %7200 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,16,32,100],f32> %int0_9427 = torch.constant.int 0 %7202 = torch.aten.index_select %7201, %int0_9427, %7195 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_9428 = torch.constant.int 4 %int16_9429 = torch.constant.int 16 %int32_9430 = torch.constant.int 32 %int100_9431 = torch.constant.int 100 %7203 = torch.prim.ListConstruct %int4_9428, %655, %int16_9429, %int32_9430, %int100_9431 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %7204 = torch.aten.view %7202, %7203 : 
!torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_9432 = torch.constant.int 1 %7205 = torch.aten.size.int %7204, %int1_9432 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_9433 = torch.constant.int 16 %7206 = torch.aten.mul.int %7205, %int16_9433 : !torch.int, !torch.int -> !torch.int %int4_9434 = torch.constant.int 4 %int32_9435 = torch.constant.int 32 %int100_9436 = torch.constant.int 100 %7207 = torch.prim.ListConstruct %int4_9434, %7206, %int32_9435, %int100_9436 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %7208 = torch.aten.view %7204, %7207 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_9437 = torch.constant.int 0 %int0_9438 = torch.constant.int 0 %int9223372036854775807_9439 = torch.constant.int 9223372036854775807 %int1_9440 = torch.constant.int 1 %7209 = torch.aten.slice.Tensor %6950, %int0_9437, %int0_9438, %int9223372036854775807_9439, %int1_9440 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int16_9441 = torch.constant.int 16 %7210 = torch.aten.mul.int %655, %int16_9441 : !torch.int, !torch.int -> !torch.int %int1_9442 = torch.constant.int 1 %int0_9443 = torch.constant.int 0 %int1_9444 = torch.constant.int 1 %7211 = torch.aten.slice.Tensor %7209, %int1_9442, %int0_9443, %7210, %int1_9444 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_9445 = torch.constant.bool false %7212 = torch.aten.copy %7211, %7208, %false_9445 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_9446 = torch.constant.int 0 %int0_9447 = torch.constant.int 0 %int9223372036854775807_9448 = torch.constant.int 9223372036854775807 %int1_9449 = torch.constant.int 1 %7213 = torch.aten.slice.Tensor %6950, %int0_9446, %int0_9447, 
%int9223372036854775807_9448, %int1_9449 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_9450 = torch.constant.int 1 %int0_9451 = torch.constant.int 0 %int1_9452 = torch.constant.int 1 %7214 = torch.aten.slice_scatter %7213, %7212, %int1_9450, %int0_9451, %7210, %int1_9452 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_9453 = torch.constant.int 0 %int0_9454 = torch.constant.int 0 %int9223372036854775807_9455 = torch.constant.int 9223372036854775807 %int1_9456 = torch.constant.int 1 %7215 = torch.aten.slice_scatter %6950, %7214, %int0_9453, %int0_9454, %int9223372036854775807_9455, %int1_9456 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_9457 = torch.constant.int 1 %int1_9458 = torch.constant.int 1 %7216 = torch.aten.add.Scalar %7192, %int1_9457, %int1_9458 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_9459 = torch.constant.int 4 %7217 = torch.aten.mul.int %int4_9459, %655 : !torch.int, !torch.int -> !torch.int %7218 = torch.prim.ListConstruct %7217 : (!torch.int) -> !torch.list %7219 = torch.aten.view %7216, %7218 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int0_9460 = torch.constant.int 0 %7220 = torch.aten.index_select %7201, %int0_9460, %7219 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_9461 = torch.constant.int 4 %int16_9462 = torch.constant.int 16 %int32_9463 = torch.constant.int 32 %int100_9464 = torch.constant.int 100 %7221 = torch.prim.ListConstruct %int4_9461, %655, %int16_9462, %int32_9463, %int100_9464 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %7222 = 
torch.aten.view %7220, %7221 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_9465 = torch.constant.int 1 %7223 = torch.aten.size.int %7222, %int1_9465 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_9466 = torch.constant.int 16 %7224 = torch.aten.mul.int %7223, %int16_9466 : !torch.int, !torch.int -> !torch.int %int4_9467 = torch.constant.int 4 %int32_9468 = torch.constant.int 32 %int100_9469 = torch.constant.int 100 %7225 = torch.prim.ListConstruct %int4_9467, %7224, %int32_9468, %int100_9469 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %7226 = torch.aten.view %7222, %7225 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_9470 = torch.constant.int 0 %int0_9471 = torch.constant.int 0 %int9223372036854775807_9472 = torch.constant.int 9223372036854775807 %int1_9473 = torch.constant.int 1 %7227 = torch.aten.slice.Tensor %6967, %int0_9470, %int0_9471, %int9223372036854775807_9472, %int1_9473 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_9474 = torch.constant.int 1 %int0_9475 = torch.constant.int 0 %int1_9476 = torch.constant.int 1 %7228 = torch.aten.slice.Tensor %7227, %int1_9474, %int0_9475, %7210, %int1_9476 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_9477 = torch.constant.bool false %7229 = torch.aten.copy %7228, %7226, %false_9477 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_9478 = torch.constant.int 0 %int0_9479 = torch.constant.int 0 %int9223372036854775807_9480 = torch.constant.int 9223372036854775807 %int1_9481 = torch.constant.int 1 %7230 = torch.aten.slice.Tensor %6967, %int0_9478, %int0_9479, %int9223372036854775807_9480, %int1_9481 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, 
!torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_9482 = torch.constant.int 1 %int0_9483 = torch.constant.int 0 %int1_9484 = torch.constant.int 1 %7231 = torch.aten.slice_scatter %7230, %7229, %int1_9482, %int0_9483, %7210, %int1_9484 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_9485 = torch.constant.int 0 %int0_9486 = torch.constant.int 0 %int9223372036854775807_9487 = torch.constant.int 9223372036854775807 %int1_9488 = torch.constant.int 1 %7232 = torch.aten.slice_scatter %6967, %7231, %int0_9485, %int0_9486, %int9223372036854775807_9487, %int1_9488 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_9489 = torch.constant.int 0 %int0_9490 = torch.constant.int 0 %int9223372036854775807_9491 = torch.constant.int 9223372036854775807 %int1_9492 = torch.constant.int 1 %7233 = torch.aten.slice.Tensor %671, %int0_9489, %int0_9490, %int9223372036854775807_9491, %int1_9492 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_9493 = torch.constant.int 1 %int0_9494 = torch.constant.int 0 %int1_9495 = torch.constant.int 1 %7234 = torch.aten.slice.Tensor %7233, %int1_9493, %int0_9494, %7210, %int1_9495 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int0_9496 = torch.constant.int 0 %int0_9497 = torch.constant.int 0 %int9223372036854775807_9498 = torch.constant.int 9223372036854775807 %int1_9499 = torch.constant.int 1 %7235 = torch.aten.slice.Tensor %673, %int0_9496, %int0_9497, %int9223372036854775807_9498, %int1_9499 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_9500 = 
torch.constant.int 1 %int0_9501 = torch.constant.int 0 %int1_9502 = torch.constant.int 1 %7236 = torch.aten.slice.Tensor %7235, %int1_9500, %int0_9501, %7210, %int1_9502 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_9503 = torch.constant.int 1 %int2_9504 = torch.constant.int 2 %7237 = torch.aten.transpose.int %7073, %int1_9503, %int2_9504 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,1,100],f32> %int4_9505 = torch.constant.int 4 %int32_9506 = torch.constant.int 32 %int1_9507 = torch.constant.int 1 %int100_9508 = torch.constant.int 100 %7238 = torch.prim.ListConstruct %int4_9505, %int32_9506, %int1_9507, %int100_9508 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_9509 = torch.constant.bool false %7239 = torch.aten.expand %7237, %7238, %false_9509 : !torch.vtensor<[4,32,1,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,100],f32> %int128_9510 = torch.constant.int 128 %int1_9511 = torch.constant.int 1 %int100_9512 = torch.constant.int 100 %7240 = torch.prim.ListConstruct %int128_9510, %int1_9511, %int100_9512 : (!torch.int, !torch.int, !torch.int) -> !torch.list %7241 = torch.aten.view %7239, %7240 : !torch.vtensor<[4,32,1,100],f32>, !torch.list -> !torch.vtensor<[128,1,100],f32> %int0_9513 = torch.constant.int 0 %int0_9514 = torch.constant.int 0 %int9223372036854775807_9515 = torch.constant.int 9223372036854775807 %int1_9516 = torch.constant.int 1 %7242 = torch.aten.slice.Tensor %7215, %int0_9513, %int0_9514, %int9223372036854775807_9515, %int1_9516 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_9517 = torch.constant.int 1 %int0_9518 = torch.constant.int 0 %int1_9519 = torch.constant.int 1 %7243 = torch.aten.slice.Tensor %7242, %int1_9517, %int0_9518, %7210, %int1_9519 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, 
!torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_9520 = torch.constant.int 1 %int2_9521 = torch.constant.int 2 %7244 = torch.aten.transpose.int %7243, %int1_9520, %int2_9521 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int2_9522 = torch.constant.int 2 %int3_9523 = torch.constant.int 3 %7245 = torch.aten.transpose.int %7244, %int2_9522, %int3_9523 : !torch.vtensor<[4,32,?,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int1_9524 = torch.constant.int 1 %7246 = torch.aten.size.int %7234, %int1_9524 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_9525 = torch.constant.int 4 %int32_9526 = torch.constant.int 32 %int100_9527 = torch.constant.int 100 %7247 = torch.prim.ListConstruct %int4_9525, %int32_9526, %int100_9527, %7246 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_9528 = torch.constant.bool false %7248 = torch.aten.expand %7245, %7247, %false_9528 : !torch.vtensor<[4,32,100,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,100,?],f32> %int0_9529 = torch.constant.int 0 %7249 = torch.aten.clone %7248, %int0_9529 : !torch.vtensor<[4,32,100,?],f32>, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int128_9530 = torch.constant.int 128 %int100_9531 = torch.constant.int 100 %7250 = torch.prim.ListConstruct %int128_9530, %int100_9531, %7246 : (!torch.int, !torch.int, !torch.int) -> !torch.list %7251 = torch.aten._unsafe_view %7249, %7250 : !torch.vtensor<[4,32,100,?],f32>, !torch.list -> !torch.vtensor<[128,100,?],f32> %7252 = torch.aten.bmm %7241, %7251 : !torch.vtensor<[128,1,100],f32>, !torch.vtensor<[128,100,?],f32> -> !torch.vtensor<[128,1,?],f32> %int4_9532 = torch.constant.int 4 %int32_9533 = torch.constant.int 32 %int1_9534 = torch.constant.int 1 %7253 = torch.prim.ListConstruct %int4_9532, %int32_9533, %int1_9534, %7246 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %7254 = torch.aten.view 
%7252, %7253 : !torch.vtensor<[128,1,?],f32>, !torch.list -> !torch.vtensor<[4,32,1,?],f32> %float1.000000e01_9535 = torch.constant.float 1.000000e+01 %7255 = torch.aten.div.Scalar %7254, %float1.000000e01_9535 : !torch.vtensor<[4,32,1,?],f32>, !torch.float -> !torch.vtensor<[4,32,1,?],f32> %int1_9536 = torch.constant.int 1 %7256 = torch.aten.add.Tensor %7255, %895, %int1_9536 : !torch.vtensor<[4,32,1,?],f32>, !torch.vtensor<[4,1,1,?],f32>, !torch.int -> !torch.vtensor<[4,32,1,?],f32> %int-1_9537 = torch.constant.int -1 %false_9538 = torch.constant.bool false %7257 = torch.aten._softmax %7256, %int-1_9537, %false_9538 : !torch.vtensor<[4,32,1,?],f32>, !torch.int, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int4_9539 = torch.constant.int 4 %int32_9540 = torch.constant.int 32 %int1_9541 = torch.constant.int 1 %7258 = torch.prim.ListConstruct %int4_9539, %int32_9540, %int1_9541, %7246 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_9542 = torch.constant.bool false %7259 = torch.aten.expand %7257, %7258, %false_9542 : !torch.vtensor<[4,32,1,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int128_9543 = torch.constant.int 128 %int1_9544 = torch.constant.int 1 %7260 = torch.prim.ListConstruct %int128_9543, %int1_9544, %7246 : (!torch.int, !torch.int, !torch.int) -> !torch.list %7261 = torch.aten.view %7259, %7260 : !torch.vtensor<[4,32,1,?],f32>, !torch.list -> !torch.vtensor<[128,1,?],f32> %int0_9545 = torch.constant.int 0 %int0_9546 = torch.constant.int 0 %int9223372036854775807_9547 = torch.constant.int 9223372036854775807 %int1_9548 = torch.constant.int 1 %7262 = torch.aten.slice.Tensor %7232, %int0_9545, %int0_9546, %int9223372036854775807_9547, %int1_9548 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_9549 = torch.constant.int 1 %int0_9550 = torch.constant.int 0 %int1_9551 = torch.constant.int 1 %7263 = torch.aten.slice.Tensor %7262, 
%int1_9549, %int0_9550, %7210, %int1_9551 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_9552 = torch.constant.int 1 %int2_9553 = torch.constant.int 2 %7264 = torch.aten.transpose.int %7263, %int1_9552, %int2_9553 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int1_9554 = torch.constant.int 1 %7265 = torch.aten.size.int %7236, %int1_9554 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_9555 = torch.constant.int 4 %int32_9556 = torch.constant.int 32 %int100_9557 = torch.constant.int 100 %7266 = torch.prim.ListConstruct %int4_9555, %int32_9556, %7265, %int100_9557 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_9558 = torch.constant.bool false %7267 = torch.aten.expand %7264, %7266, %false_9558 : !torch.vtensor<[4,32,?,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,?,100],f32> %int0_9559 = torch.constant.int 0 %7268 = torch.aten.clone %7267, %int0_9559 : !torch.vtensor<[4,32,?,100],f32>, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int128_9560 = torch.constant.int 128 %int100_9561 = torch.constant.int 100 %7269 = torch.prim.ListConstruct %int128_9560, %7265, %int100_9561 : (!torch.int, !torch.int, !torch.int) -> !torch.list %7270 = torch.aten._unsafe_view %7268, %7269 : !torch.vtensor<[4,32,?,100],f32>, !torch.list -> !torch.vtensor<[128,?,100],f32> %7271 = torch.aten.bmm %7261, %7270 : !torch.vtensor<[128,1,?],f32>, !torch.vtensor<[128,?,100],f32> -> !torch.vtensor<[128,1,100],f32> %int4_9562 = torch.constant.int 4 %int32_9563 = torch.constant.int 32 %int1_9564 = torch.constant.int 1 %int100_9565 = torch.constant.int 100 %7272 = torch.prim.ListConstruct %int4_9562, %int32_9563, %int1_9564, %int100_9565 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %7273 = torch.aten.view %7271, %7272 : !torch.vtensor<[128,1,100],f32>, !torch.list -> 
!torch.vtensor<[4,32,1,100],f32> %int1_9566 = torch.constant.int 1 %int2_9567 = torch.constant.int 2 %7274 = torch.aten.transpose.int %7273, %int1_9566, %int2_9567 : !torch.vtensor<[4,32,1,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,1,32,100],f32> %int4_9568 = torch.constant.int 4 %int1_9569 = torch.constant.int 1 %int-1_9570 = torch.constant.int -1 %7275 = torch.prim.ListConstruct %int4_9568, %int1_9569, %int-1_9570 : (!torch.int, !torch.int, !torch.int) -> !torch.list %7276 = torch.aten.view %7274, %7275 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,3200],f32> %7277 = torch_c.to_builtin_tensor %7276 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_9571 = tensor.cast %7277 : tensor<4x1x3200xf32> to tensor %7278 = torch_c.to_builtin_tensor %222 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %7279 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_9571, %7278) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_9572 = tensor.cast %7279 : tensor to tensor<4x1x3200xf32> %7280 = torch_c.from_builtin_tensor %cast_9572 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int1_9573 = torch.constant.int 1 %7281 = torch.aten.add.Tensor %7038, %7280, %int1_9573 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_9574 = torch.constant.int 2 %7282 = torch.aten.pow.Tensor_Scalar %7281, %int2_9574 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_9575 = torch.constant.int -1 %7283 = torch.prim.ListConstruct %int-1_9575 : (!torch.int) -> !torch.list %true_9576 = torch.constant.bool true %none_9577 = torch.constant.none %7284 = torch.aten.mean.dim %7282, %7283, %true_9576, %none_9577 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_9578 = torch.constant.float 9.9999999747524271E-7 %int1_9579 = torch.constant.int 1 %7285 = 
torch.aten.add.Scalar %7284, %float9.999990e-07_9578, %int1_9579 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %7286 = torch.aten.rsqrt %7285 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %7287 = torch.aten.mul.Tensor %7281, %7286 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %7288 = torch.aten.mul.Tensor %7287, %223 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %7289 = torch_c.to_builtin_tensor %7288 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_9580 = tensor.cast %7289 : tensor<4x1x3200xf32> to tensor %7290 = torch_c.to_builtin_tensor %224 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %7291 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_9580, %7290) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_9581 = tensor.cast %7291 : tensor to tensor<4x1x8640xf32> %7292 = torch_c.from_builtin_tensor %cast_9581 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %7293 = torch.aten.silu %7292 : !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32> %7294 = torch_c.to_builtin_tensor %7288 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_9582 = tensor.cast %7294 : tensor<4x1x3200xf32> to tensor %7295 = torch_c.to_builtin_tensor %225 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %7296 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_9582, %7295) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_9583 = tensor.cast %7296 : tensor to tensor<4x1x8640xf32> %7297 = torch_c.from_builtin_tensor %cast_9583 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %7298 = torch.aten.mul.Tensor %7293, %7297 : !torch.vtensor<[4,1,8640],f32>, !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32> %7299 = torch_c.to_builtin_tensor %7298 : !torch.vtensor<[4,1,8640],f32> -> tensor<4x1x8640xf32> %cast_9584 = tensor.cast %7299 : 
tensor<4x1x8640xf32> to tensor %7300 = torch_c.to_builtin_tensor %226 : !torch.vtensor<[3200,8640],f16> -> tensor<3200x8640xf16> %7301 = util.call @sharktank_mmtfp_3d_3200_8640_f32f16f32(%cast_9584, %7300) : (tensor, tensor<3200x8640xf16>) -> tensor %cast_9585 = tensor.cast %7301 : tensor to tensor<4x1x3200xf32> %7302 = torch_c.from_builtin_tensor %cast_9585 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int1_9586 = torch.constant.int 1 %7303 = torch.aten.add.Tensor %7281, %7302, %int1_9586 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_9587 = torch.constant.int 2 %7304 = torch.aten.pow.Tensor_Scalar %7303, %int2_9587 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_9588 = torch.constant.int -1 %7305 = torch.prim.ListConstruct %int-1_9588 : (!torch.int) -> !torch.list %true_9589 = torch.constant.bool true %none_9590 = torch.constant.none %7306 = torch.aten.mean.dim %7304, %7305, %true_9589, %none_9590 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_9591 = torch.constant.float 9.9999999747524271E-7 %int1_9592 = torch.constant.int 1 %7307 = torch.aten.add.Scalar %7306, %float9.999990e-07_9591, %int1_9592 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %7308 = torch.aten.rsqrt %7307 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %7309 = torch.aten.mul.Tensor %7303, %7308 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %7310 = torch.aten.mul.Tensor %7309, %227 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %7311 = torch_c.to_builtin_tensor %7310 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_9593 = tensor.cast %7311 : tensor<4x1x3200xf32> to tensor %7312 = torch_c.to_builtin_tensor %228 : 
!torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %7313 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_9593, %7312) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_9594 = tensor.cast %7313 : tensor to tensor<4x1x3200xf32> %7314 = torch_c.from_builtin_tensor %cast_9594 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %7315 = torch_c.to_builtin_tensor %7310 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_9595 = tensor.cast %7315 : tensor<4x1x3200xf32> to tensor %7316 = torch_c.to_builtin_tensor %229 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %7317 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_9595, %7316) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_9596 = tensor.cast %7317 : tensor to tensor<4x1x3200xf32> %7318 = torch_c.from_builtin_tensor %cast_9596 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %7319 = torch_c.to_builtin_tensor %7310 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_9597 = tensor.cast %7319 : tensor<4x1x3200xf32> to tensor %7320 = torch_c.to_builtin_tensor %230 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %7321 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_9597, %7320) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_9598 = tensor.cast %7321 : tensor to tensor<4x1x3200xf32> %7322 = torch_c.from_builtin_tensor %cast_9598 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int4_9599 = torch.constant.int 4 %int1_9600 = torch.constant.int 1 %int32_9601 = torch.constant.int 32 %int100_9602 = torch.constant.int 100 %7323 = torch.prim.ListConstruct %int4_9599, %int1_9600, %int32_9601, %int100_9602 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %7324 = torch.aten.view %7314, %7323 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_9603 = torch.constant.int 4 %int1_9604 = torch.constant.int 1 %int32_9605 = torch.constant.int 32 %int100_9606 = torch.constant.int 100 %7325 
= torch.prim.ListConstruct %int4_9603, %int1_9604, %int32_9605, %int100_9606 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %7326 = torch.aten.view %7318, %7325 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_9607 = torch.constant.int 4 %int1_9608 = torch.constant.int 1 %int32_9609 = torch.constant.int 32 %int100_9610 = torch.constant.int 100 %7327 = torch.prim.ListConstruct %int4_9607, %int1_9608, %int32_9609, %int100_9610 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %7328 = torch.aten.view %7322, %7327 : !torch.vtensor<[4,1,3200],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int4_9611 = torch.constant.int 4 %int1_9612 = torch.constant.int 1 %int32_9613 = torch.constant.int 32 %int-1_9614 = torch.constant.int -1 %int2_9615 = torch.constant.int 2 %7329 = torch.prim.ListConstruct %int4_9611, %int1_9612, %int32_9613, %int-1_9614, %int2_9615 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %7330 = torch.aten.view %7324, %7329 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %7331 = torch.aten.view_as_complex %7330 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %int4_9616 = torch.constant.int 4 %int1_9617 = torch.constant.int 1 %int32_9618 = torch.constant.int 32 %int-1_9619 = torch.constant.int -1 %int2_9620 = torch.constant.int 2 %7332 = torch.prim.ListConstruct %int4_9616, %int1_9617, %int32_9618, %int-1_9619, %int2_9620 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %7333 = torch.aten.view %7326, %7332 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,32,50,2],f32> %7334 = torch.aten.view_as_complex %7333 : !torch.vtensor<[4,1,32,50,2],f32> -> !torch.vtensor<[4,1,32,50],complex> %7335 = torch.aten.mul.Tensor %7331, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> 
%7336 = torch.aten.view_as_real %7335 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_9621 = torch.constant.int 4 %int1_9622 = torch.constant.int 1 %int32_9623 = torch.constant.int 32 %int100_9624 = torch.constant.int 100 %7337 = torch.prim.ListConstruct %int4_9621, %int1_9622, %int32_9623, %int100_9624 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %7338 = torch.aten.view %7336, %7337 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %7339 = torch.aten.mul.Tensor %7334, %669 : !torch.vtensor<[4,1,32,50],complex>, !torch.vtensor<[4,1,1,50],complex> -> !torch.vtensor<[4,1,32,50],complex> %7340 = torch.aten.view_as_real %7339 : !torch.vtensor<[4,1,32,50],complex> -> !torch.vtensor<[4,1,32,50,2],f32> %int4_9625 = torch.constant.int 4 %int1_9626 = torch.constant.int 1 %int32_9627 = torch.constant.int 32 %int100_9628 = torch.constant.int 100 %7341 = torch.prim.ListConstruct %int4_9625, %int1_9626, %int32_9627, %int100_9628 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %7342 = torch.aten.view %7340, %7341 : !torch.vtensor<[4,1,32,50,2],f32>, !torch.list -> !torch.vtensor<[4,1,32,100],f32> %int1_9629 = torch.constant.int 1 %int1_9630 = torch.constant.int 1 %7343 = torch.aten.add.Scalar %arg2, %int1_9629, %int1_9630 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[4],si64> %int0_9631 = torch.constant.int 0 %int0_9632 = torch.constant.int 0 %7344 = torch.aten.select.int %7343, %int0_9631, %int0_9632 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_9633 = torch.constant.int 0 %int0_9634 = torch.constant.int 0 %7345 = torch.aten.select.int %arg3, %int0_9633, %int0_9634 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_9635 = torch.constant.int 0 %int0_9636 = torch.constant.int 0 %int9223372036854775807_9637 = torch.constant.int 9223372036854775807 %int1_9638 = torch.constant.int 
1 %7346 = torch.aten.slice.Tensor %7345, %int0_9635, %int0_9636, %int9223372036854775807_9637, %int1_9638 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_9639 = torch.constant.int 16 %7347 = torch.aten.floor_divide.Scalar %7344, %int16_9639 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_9640 = torch.constant.int 0 %7348 = torch.aten.index_select %7346, %int0_9640, %7347 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_9641 = torch.constant.int 16 %7349 = torch.aten.remainder.Scalar %7344, %int16_9641 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_9642 = torch.constant.none %7350 = torch.aten.clone %638, %none_9642 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_9643 = torch.constant.none %7351 = torch.aten.clone %639, %none_9643 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_9644 = torch.constant.int 0 %7352 = torch.aten.unsqueeze %7349, %int0_9644 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_9645 = torch.constant.int 0 %int0_9646 = torch.constant.int 0 %7353 = torch.aten.select.int %7342, %int0_9645, %int0_9646 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_9647 = torch.constant.int 0 %int0_9648 = torch.constant.int 0 %7354 = torch.aten.select.int %7353, %int0_9647, %int0_9648 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %int-1_9649 = torch.constant.int -1 %int26_9650 = torch.constant.int 26 %int2_9651 = torch.constant.int 2 %int16_9652 = torch.constant.int 16 %int32_9653 = torch.constant.int 32 %int100_9654 = torch.constant.int 100 %7355 = torch.prim.ListConstruct %int-1_9649, %int26_9650, %int2_9651, %int16_9652, %int32_9653, %int100_9654 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %7356 
= torch.aten.view %7190, %7355 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %7357 = torch.prim.ListConstruct %7348, %7350, %7351, %7352 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_9655 = torch.constant.bool false %7358 = torch.aten.index_put %7356, %7357, %7354, %false_9655 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_9656 = torch.constant.int 2662400 %7359 = torch.prim.ListConstruct %731, %int2662400_9656 : (!torch.int, !torch.int) -> !torch.list %7360 = torch.aten.view %7358, %7359 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_9657 = torch.constant.int -1 %int26_9658 = torch.constant.int 26 %int2_9659 = torch.constant.int 2 %int16_9660 = torch.constant.int 16 %int32_9661 = torch.constant.int 32 %int100_9662 = torch.constant.int 100 %7361 = torch.prim.ListConstruct %int-1_9657, %int26_9658, %int2_9659, %int16_9660, %int32_9661, %int100_9662 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %7362 = torch.aten.view %7360, %7361 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_9663 = torch.constant.none %7363 = torch.aten.clone %640, %none_9663 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_9664 = torch.constant.none %7364 = torch.aten.clone %641, %none_9664 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_9665 = torch.constant.int 0 %7365 = torch.aten.unsqueeze %7349, %int0_9665 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_9666 = torch.constant.int 0 %int0_9667 = torch.constant.int 0 %7366 = torch.aten.select.int %7328, %int0_9666, %int0_9667 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> 
!torch.vtensor<[1,32,100],f32> %int0_9668 = torch.constant.int 0 %int0_9669 = torch.constant.int 0 %7367 = torch.aten.select.int %7366, %int0_9668, %int0_9669 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %7368 = torch.prim.ListConstruct %7348, %7363, %7364, %7365 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_9670 = torch.constant.bool false %7369 = torch.aten.index_put %7362, %7368, %7367, %false_9670 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_9671 = torch.constant.int 2662400 %7370 = torch.prim.ListConstruct %731, %int2662400_9671 : (!torch.int, !torch.int) -> !torch.list %7371 = torch.aten.view %7369, %7370 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_9672 = torch.constant.int -1 %int26_9673 = torch.constant.int 26 %int2_9674 = torch.constant.int 2 %int16_9675 = torch.constant.int 16 %int32_9676 = torch.constant.int 32 %int100_9677 = torch.constant.int 100 %7372 = torch.prim.ListConstruct %int-1_9672, %int26_9673, %int2_9674, %int16_9675, %int32_9676, %int100_9677 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %7373 = torch.aten.view %7371, %7372 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_9678 = torch.constant.int 0 %int1_9679 = torch.constant.int 1 %7374 = torch.aten.select.int %7343, %int0_9678, %int1_9679 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_9680 = torch.constant.int 0 %int1_9681 = torch.constant.int 1 %7375 = torch.aten.select.int %arg3, %int0_9680, %int1_9681 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_9682 = torch.constant.int 0 %int0_9683 = torch.constant.int 0 %int9223372036854775807_9684 = 
torch.constant.int 9223372036854775807 %int1_9685 = torch.constant.int 1 %7376 = torch.aten.slice.Tensor %7375, %int0_9682, %int0_9683, %int9223372036854775807_9684, %int1_9685 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_9686 = torch.constant.int 16 %7377 = torch.aten.floor_divide.Scalar %7374, %int16_9686 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_9687 = torch.constant.int 0 %7378 = torch.aten.index_select %7376, %int0_9687, %7377 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_9688 = torch.constant.int 16 %7379 = torch.aten.remainder.Scalar %7374, %int16_9688 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_9689 = torch.constant.none %7380 = torch.aten.clone %642, %none_9689 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_9690 = torch.constant.none %7381 = torch.aten.clone %643, %none_9690 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_9691 = torch.constant.int 0 %7382 = torch.aten.unsqueeze %7379, %int0_9691 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_9692 = torch.constant.int 0 %int1_9693 = torch.constant.int 1 %7383 = torch.aten.select.int %7342, %int0_9692, %int1_9693 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_9694 = torch.constant.int 0 %int0_9695 = torch.constant.int 0 %7384 = torch.aten.select.int %7383, %int0_9694, %int0_9695 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %7385 = torch.prim.ListConstruct %7378, %7380, %7381, %7382 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_9696 = torch.constant.bool false %7386 = torch.aten.index_put %7373, %7385, %7384, %false_9696 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, 
!torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_9697 = torch.constant.int 2662400 %7387 = torch.prim.ListConstruct %731, %int2662400_9697 : (!torch.int, !torch.int) -> !torch.list %7388 = torch.aten.view %7386, %7387 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_9698 = torch.constant.int -1 %int26_9699 = torch.constant.int 26 %int2_9700 = torch.constant.int 2 %int16_9701 = torch.constant.int 16 %int32_9702 = torch.constant.int 32 %int100_9703 = torch.constant.int 100 %7389 = torch.prim.ListConstruct %int-1_9698, %int26_9699, %int2_9700, %int16_9701, %int32_9702, %int100_9703 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %7390 = torch.aten.view %7388, %7389 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_9704 = torch.constant.none %7391 = torch.aten.clone %644, %none_9704 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_9705 = torch.constant.none %7392 = torch.aten.clone %645, %none_9705 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_9706 = torch.constant.int 0 %7393 = torch.aten.unsqueeze %7379, %int0_9706 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_9707 = torch.constant.int 0 %int1_9708 = torch.constant.int 1 %7394 = torch.aten.select.int %7328, %int0_9707, %int1_9708 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_9709 = torch.constant.int 0 %int0_9710 = torch.constant.int 0 %7395 = torch.aten.select.int %7394, %int0_9709, %int0_9710 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %7396 = torch.prim.ListConstruct %7378, %7391, %7392, %7393 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_9711 = torch.constant.bool false %7397 = 
torch.aten.index_put %7390, %7396, %7395, %false_9711 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_9712 = torch.constant.int 2662400 %7398 = torch.prim.ListConstruct %731, %int2662400_9712 : (!torch.int, !torch.int) -> !torch.list %7399 = torch.aten.view %7397, %7398 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_9713 = torch.constant.int -1 %int26_9714 = torch.constant.int 26 %int2_9715 = torch.constant.int 2 %int16_9716 = torch.constant.int 16 %int32_9717 = torch.constant.int 32 %int100_9718 = torch.constant.int 100 %7400 = torch.prim.ListConstruct %int-1_9713, %int26_9714, %int2_9715, %int16_9716, %int32_9717, %int100_9718 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %7401 = torch.aten.view %7399, %7400 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_9719 = torch.constant.int 0 %int2_9720 = torch.constant.int 2 %7402 = torch.aten.select.int %7343, %int0_9719, %int2_9720 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_9721 = torch.constant.int 0 %int2_9722 = torch.constant.int 2 %7403 = torch.aten.select.int %arg3, %int0_9721, %int2_9722 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_9723 = torch.constant.int 0 %int0_9724 = torch.constant.int 0 %int9223372036854775807_9725 = torch.constant.int 9223372036854775807 %int1_9726 = torch.constant.int 1 %7404 = torch.aten.slice.Tensor %7403, %int0_9723, %int0_9724, %int9223372036854775807_9725, %int1_9726 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_9727 = torch.constant.int 16 %7405 = torch.aten.floor_divide.Scalar %7402, %int16_9727 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_9728 = torch.constant.int 0 %7406 
= torch.aten.index_select %7404, %int0_9728, %7405 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_9729 = torch.constant.int 16 %7407 = torch.aten.remainder.Scalar %7402, %int16_9729 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_9730 = torch.constant.none %7408 = torch.aten.clone %646, %none_9730 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_9731 = torch.constant.none %7409 = torch.aten.clone %647, %none_9731 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_9732 = torch.constant.int 0 %7410 = torch.aten.unsqueeze %7407, %int0_9732 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_9733 = torch.constant.int 0 %int2_9734 = torch.constant.int 2 %7411 = torch.aten.select.int %7342, %int0_9733, %int2_9734 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_9735 = torch.constant.int 0 %int0_9736 = torch.constant.int 0 %7412 = torch.aten.select.int %7411, %int0_9735, %int0_9736 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %7413 = torch.prim.ListConstruct %7406, %7408, %7409, %7410 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_9737 = torch.constant.bool false %7414 = torch.aten.index_put %7401, %7413, %7412, %false_9737 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_9738 = torch.constant.int 2662400 %7415 = torch.prim.ListConstruct %731, %int2662400_9738 : (!torch.int, !torch.int) -> !torch.list %7416 = torch.aten.view %7414, %7415 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_9739 = torch.constant.int -1 %int26_9740 = torch.constant.int 26 %int2_9741 = torch.constant.int 2 %int16_9742 = 
torch.constant.int 16 %int32_9743 = torch.constant.int 32 %int100_9744 = torch.constant.int 100 %7417 = torch.prim.ListConstruct %int-1_9739, %int26_9740, %int2_9741, %int16_9742, %int32_9743, %int100_9744 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %7418 = torch.aten.view %7416, %7417 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_9745 = torch.constant.none %7419 = torch.aten.clone %648, %none_9745 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_9746 = torch.constant.none %7420 = torch.aten.clone %649, %none_9746 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_9747 = torch.constant.int 0 %7421 = torch.aten.unsqueeze %7407, %int0_9747 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_9748 = torch.constant.int 0 %int2_9749 = torch.constant.int 2 %7422 = torch.aten.select.int %7328, %int0_9748, %int2_9749 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_9750 = torch.constant.int 0 %int0_9751 = torch.constant.int 0 %7423 = torch.aten.select.int %7422, %int0_9750, %int0_9751 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %7424 = torch.prim.ListConstruct %7406, %7419, %7420, %7421 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_9752 = torch.constant.bool false %7425 = torch.aten.index_put %7418, %7424, %7423, %false_9752 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_9753 = torch.constant.int 2662400 %7426 = torch.prim.ListConstruct %731, %int2662400_9753 : (!torch.int, !torch.int) -> !torch.list %7427 = torch.aten.view %7425, %7426 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_9754 
= torch.constant.int -1 %int26_9755 = torch.constant.int 26 %int2_9756 = torch.constant.int 2 %int16_9757 = torch.constant.int 16 %int32_9758 = torch.constant.int 32 %int100_9759 = torch.constant.int 100 %7428 = torch.prim.ListConstruct %int-1_9754, %int26_9755, %int2_9756, %int16_9757, %int32_9758, %int100_9759 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %7429 = torch.aten.view %7427, %7428 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int0_9760 = torch.constant.int 0 %int3_9761 = torch.constant.int 3 %7430 = torch.aten.select.int %7343, %int0_9760, %int3_9761 : !torch.vtensor<[4],si64>, !torch.int, !torch.int -> !torch.vtensor<[],si64> %int0_9762 = torch.constant.int 0 %int3_9763 = torch.constant.int 3 %7431 = torch.aten.select.int %arg3, %int0_9762, %int3_9763 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int0_9764 = torch.constant.int 0 %int0_9765 = torch.constant.int 0 %int9223372036854775807_9766 = torch.constant.int 9223372036854775807 %int1_9767 = torch.constant.int 1 %7432 = torch.aten.slice.Tensor %7431, %int0_9764, %int0_9765, %int9223372036854775807_9766, %int1_9767 : !torch.vtensor<[?],si64>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[?],si64> %int16_9768 = torch.constant.int 16 %7433 = torch.aten.floor_divide.Scalar %7430, %int16_9768 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %int0_9769 = torch.constant.int 0 %7434 = torch.aten.index_select %7432, %int0_9769, %7433 : !torch.vtensor<[?],si64>, !torch.int, !torch.vtensor<[],si64> -> !torch.vtensor<[1],si64> %int16_9770 = torch.constant.int 16 %7435 = torch.aten.remainder.Scalar %7430, %int16_9770 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[],si64> %none_9771 = torch.constant.none %7436 = torch.aten.clone %650, %none_9771 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_9772 = torch.constant.none 
%7437 = torch.aten.clone %651, %none_9772 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_9773 = torch.constant.int 0 %7438 = torch.aten.unsqueeze %7435, %int0_9773 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_9774 = torch.constant.int 0 %int3_9775 = torch.constant.int 3 %7439 = torch.aten.select.int %7342, %int0_9774, %int3_9775 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_9776 = torch.constant.int 0 %int0_9777 = torch.constant.int 0 %7440 = torch.aten.select.int %7439, %int0_9776, %int0_9777 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %7441 = torch.prim.ListConstruct %7434, %7436, %7437, %7438 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_9778 = torch.constant.bool false %7442 = torch.aten.index_put %7429, %7441, %7440, %false_9778 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_9779 = torch.constant.int 2662400 %7443 = torch.prim.ListConstruct %731, %int2662400_9779 : (!torch.int, !torch.int) -> !torch.list %7444 = torch.aten.view %7442, %7443 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> %int-1_9780 = torch.constant.int -1 %int26_9781 = torch.constant.int 26 %int2_9782 = torch.constant.int 2 %int16_9783 = torch.constant.int 16 %int32_9784 = torch.constant.int 32 %int100_9785 = torch.constant.int 100 %7445 = torch.prim.ListConstruct %int-1_9780, %int26_9781, %int2_9782, %int16_9783, %int32_9784, %int100_9785 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %7446 = torch.aten.view %7444, %7445 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %none_9786 = torch.constant.none %7447 = torch.aten.clone %652, 
%none_9786 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %none_9787 = torch.constant.none %7448 = torch.aten.clone %653, %none_9787 : !torch.vtensor<[1],si64>, !torch.none -> !torch.vtensor<[1],si64> %int0_9788 = torch.constant.int 0 %7449 = torch.aten.unsqueeze %7435, %int0_9788 : !torch.vtensor<[],si64>, !torch.int -> !torch.vtensor<[1],si64> %int0_9789 = torch.constant.int 0 %int3_9790 = torch.constant.int 3 %7450 = torch.aten.select.int %7328, %int0_9789, %int3_9790 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[1,32,100],f32> %int0_9791 = torch.constant.int 0 %int0_9792 = torch.constant.int 0 %7451 = torch.aten.select.int %7450, %int0_9791, %int0_9792 : !torch.vtensor<[1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[32,100],f32> %7452 = torch.prim.ListConstruct %7434, %7447, %7448, %7449 : (!torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>, !torch.vtensor<[1],si64>) -> !torch.list> %false_9793 = torch.constant.bool false %7453 = torch.aten.index_put %7446, %7452, %7451, %false_9793 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list>, !torch.vtensor<[32,100],f32>, !torch.bool -> !torch.vtensor<[?,26,2,16,32,100],f32> %int2662400_9794 = torch.constant.int 2662400 %7454 = torch.prim.ListConstruct %731, %int2662400_9794 : (!torch.int, !torch.int) -> !torch.list %7455 = torch.aten.view %7453, %7454 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,2662400],f32> torch.overwrite.tensor.contents %7455 overwrites %arg4 : !torch.vtensor<[?,2662400],f32>, !torch.tensor<[?,2662400],f32> %int52_9795 = torch.constant.int 52 %7456 = torch.aten.mul.Scalar %arg3, %int52_9795 : !torch.vtensor<[4,?],si64>, !torch.int -> !torch.vtensor<[4,?],si64> %int50 = torch.constant.int 50 %int1_9796 = torch.constant.int 1 %7457 = torch.aten.add.Scalar %7456, %int50, %int1_9796 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_9797 = 
torch.constant.int 4 %7458 = torch.aten.mul.int %int4_9797, %655 : !torch.int, !torch.int -> !torch.int %7459 = torch.prim.ListConstruct %7458 : (!torch.int) -> !torch.list %7460 = torch.aten.view %7457, %7459 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int-1_9798 = torch.constant.int -1 %int26_9799 = torch.constant.int 26 %int2_9800 = torch.constant.int 2 %int16_9801 = torch.constant.int 16 %int32_9802 = torch.constant.int 32 %int100_9803 = torch.constant.int 100 %7461 = torch.prim.ListConstruct %int-1_9798, %int26_9799, %int2_9800, %int16_9801, %int32_9802, %int100_9803 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %7462 = torch.aten.view %7455, %7461 : !torch.vtensor<[?,2662400],f32>, !torch.list -> !torch.vtensor<[?,26,2,16,32,100],f32> %int26_9804 = torch.constant.int 26 %7463 = torch.aten.mul.int %731, %int26_9804 : !torch.int, !torch.int -> !torch.int %int2_9805 = torch.constant.int 2 %7464 = torch.aten.mul.int %7463, %int2_9805 : !torch.int, !torch.int -> !torch.int %int16_9806 = torch.constant.int 16 %int32_9807 = torch.constant.int 32 %int100_9808 = torch.constant.int 100 %7465 = torch.prim.ListConstruct %7464, %int16_9806, %int32_9807, %int100_9808 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %7466 = torch.aten.view %7462, %7465 : !torch.vtensor<[?,26,2,16,32,100],f32>, !torch.list -> !torch.vtensor<[?,16,32,100],f32> %int0_9809 = torch.constant.int 0 %7467 = torch.aten.index_select %7466, %int0_9809, %7460 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_9810 = torch.constant.int 4 %int16_9811 = torch.constant.int 16 %int32_9812 = torch.constant.int 32 %int100_9813 = torch.constant.int 100 %7468 = torch.prim.ListConstruct %int4_9810, %655, %int16_9811, %int32_9812, %int100_9813 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %7469 = torch.aten.view %7467, %7468 : 
!torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_9814 = torch.constant.int 1 %7470 = torch.aten.size.int %7469, %int1_9814 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_9815 = torch.constant.int 16 %7471 = torch.aten.mul.int %7470, %int16_9815 : !torch.int, !torch.int -> !torch.int %int4_9816 = torch.constant.int 4 %int32_9817 = torch.constant.int 32 %int100_9818 = torch.constant.int 100 %7472 = torch.prim.ListConstruct %int4_9816, %7471, %int32_9817, %int100_9818 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %7473 = torch.aten.view %7469, %7472 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_9819 = torch.constant.int 0 %int0_9820 = torch.constant.int 0 %int9223372036854775807_9821 = torch.constant.int 9223372036854775807 %int1_9822 = torch.constant.int 1 %7474 = torch.aten.slice.Tensor %7215, %int0_9819, %int0_9820, %int9223372036854775807_9821, %int1_9822 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int16_9823 = torch.constant.int 16 %7475 = torch.aten.mul.int %655, %int16_9823 : !torch.int, !torch.int -> !torch.int %int1_9824 = torch.constant.int 1 %int0_9825 = torch.constant.int 0 %int1_9826 = torch.constant.int 1 %7476 = torch.aten.slice.Tensor %7474, %int1_9824, %int0_9825, %7475, %int1_9826 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_9827 = torch.constant.bool false %7477 = torch.aten.copy %7476, %7473, %false_9827 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_9828 = torch.constant.int 0 %int0_9829 = torch.constant.int 0 %int9223372036854775807_9830 = torch.constant.int 9223372036854775807 %int1_9831 = torch.constant.int 1 %7478 = torch.aten.slice.Tensor %7215, %int0_9828, %int0_9829, 
%int9223372036854775807_9830, %int1_9831 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_9832 = torch.constant.int 1 %int0_9833 = torch.constant.int 0 %int1_9834 = torch.constant.int 1 %7479 = torch.aten.slice_scatter %7478, %7477, %int1_9832, %int0_9833, %7475, %int1_9834 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_9835 = torch.constant.int 0 %int0_9836 = torch.constant.int 0 %int9223372036854775807_9837 = torch.constant.int 9223372036854775807 %int1_9838 = torch.constant.int 1 %7480 = torch.aten.slice_scatter %7215, %7479, %int0_9835, %int0_9836, %int9223372036854775807_9837, %int1_9838 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_9839 = torch.constant.int 1 %int1_9840 = torch.constant.int 1 %7481 = torch.aten.add.Scalar %7457, %int1_9839, %int1_9840 : !torch.vtensor<[4,?],si64>, !torch.int, !torch.int -> !torch.vtensor<[4,?],si64> %int4_9841 = torch.constant.int 4 %7482 = torch.aten.mul.int %int4_9841, %655 : !torch.int, !torch.int -> !torch.int %7483 = torch.prim.ListConstruct %7482 : (!torch.int) -> !torch.list %7484 = torch.aten.view %7481, %7483 : !torch.vtensor<[4,?],si64>, !torch.list -> !torch.vtensor<[?],si64> %int0_9842 = torch.constant.int 0 %7485 = torch.aten.index_select %7466, %int0_9842, %7484 : !torch.vtensor<[?,16,32,100],f32>, !torch.int, !torch.vtensor<[?],si64> -> !torch.vtensor<[?,16,32,100],f32> %int4_9843 = torch.constant.int 4 %int16_9844 = torch.constant.int 16 %int32_9845 = torch.constant.int 32 %int100_9846 = torch.constant.int 100 %7486 = torch.prim.ListConstruct %int4_9843, %655, %int16_9844, %int32_9845, %int100_9846 : (!torch.int, !torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %7487 = 
torch.aten.view %7485, %7486 : !torch.vtensor<[?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,16,32,100],f32> %int1_9847 = torch.constant.int 1 %7488 = torch.aten.size.int %7487, %int1_9847 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.int -> !torch.int %int16_9848 = torch.constant.int 16 %7489 = torch.aten.mul.int %7488, %int16_9848 : !torch.int, !torch.int -> !torch.int %int4_9849 = torch.constant.int 4 %int32_9850 = torch.constant.int 32 %int100_9851 = torch.constant.int 100 %7490 = torch.prim.ListConstruct %int4_9849, %7489, %int32_9850, %int100_9851 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %7491 = torch.aten.view %7487, %7490 : !torch.vtensor<[4,?,16,32,100],f32>, !torch.list -> !torch.vtensor<[4,?,32,100],f32> %int0_9852 = torch.constant.int 0 %int0_9853 = torch.constant.int 0 %int9223372036854775807_9854 = torch.constant.int 9223372036854775807 %int1_9855 = torch.constant.int 1 %7492 = torch.aten.slice.Tensor %7232, %int0_9852, %int0_9853, %int9223372036854775807_9854, %int1_9855 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_9856 = torch.constant.int 1 %int0_9857 = torch.constant.int 0 %int1_9858 = torch.constant.int 1 %7493 = torch.aten.slice.Tensor %7492, %int1_9856, %int0_9857, %7475, %int1_9858 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %false_9859 = torch.constant.bool false %7494 = torch.aten.copy %7493, %7491, %false_9859 : !torch.vtensor<[4,?,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.bool -> !torch.vtensor<[4,?,32,100],f32> %int0_9860 = torch.constant.int 0 %int0_9861 = torch.constant.int 0 %int9223372036854775807_9862 = torch.constant.int 9223372036854775807 %int1_9863 = torch.constant.int 1 %7495 = torch.aten.slice.Tensor %7232, %int0_9860, %int0_9861, %int9223372036854775807_9862, %int1_9863 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, 
!torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_9864 = torch.constant.int 1 %int0_9865 = torch.constant.int 0 %int1_9866 = torch.constant.int 1 %7496 = torch.aten.slice_scatter %7495, %7494, %int1_9864, %int0_9865, %7475, %int1_9866 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_9867 = torch.constant.int 0 %int0_9868 = torch.constant.int 0 %int9223372036854775807_9869 = torch.constant.int 9223372036854775807 %int1_9870 = torch.constant.int 1 %7497 = torch.aten.slice_scatter %7232, %7496, %int0_9867, %int0_9868, %int9223372036854775807_9869, %int1_9870 : !torch.vtensor<[4,2048,32,100],f32>, !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int0_9871 = torch.constant.int 0 %int0_9872 = torch.constant.int 0 %int9223372036854775807_9873 = torch.constant.int 9223372036854775807 %int1_9874 = torch.constant.int 1 %7498 = torch.aten.slice.Tensor %671, %int0_9871, %int0_9872, %int9223372036854775807_9873, %int1_9874 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_9875 = torch.constant.int 1 %int0_9876 = torch.constant.int 0 %int1_9877 = torch.constant.int 1 %7499 = torch.aten.slice.Tensor %7498, %int1_9875, %int0_9876, %7475, %int1_9877 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int0_9878 = torch.constant.int 0 %int0_9879 = torch.constant.int 0 %int9223372036854775807_9880 = torch.constant.int 9223372036854775807 %int1_9881 = torch.constant.int 1 %7500 = torch.aten.slice.Tensor %673, %int0_9878, %int0_9879, %int9223372036854775807_9880, %int1_9881 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_9882 = 
torch.constant.int 1 %int0_9883 = torch.constant.int 0 %int1_9884 = torch.constant.int 1 %7501 = torch.aten.slice.Tensor %7500, %int1_9882, %int0_9883, %7475, %int1_9884 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_9885 = torch.constant.int 1 %int2_9886 = torch.constant.int 2 %7502 = torch.aten.transpose.int %7338, %int1_9885, %int2_9886 : !torch.vtensor<[4,1,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,1,100],f32> %int4_9887 = torch.constant.int 4 %int32_9888 = torch.constant.int 32 %int1_9889 = torch.constant.int 1 %int100_9890 = torch.constant.int 100 %7503 = torch.prim.ListConstruct %int4_9887, %int32_9888, %int1_9889, %int100_9890 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_9891 = torch.constant.bool false %7504 = torch.aten.expand %7502, %7503, %false_9891 : !torch.vtensor<[4,32,1,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,100],f32> %int128_9892 = torch.constant.int 128 %int1_9893 = torch.constant.int 1 %int100_9894 = torch.constant.int 100 %7505 = torch.prim.ListConstruct %int128_9892, %int1_9893, %int100_9894 : (!torch.int, !torch.int, !torch.int) -> !torch.list %7506 = torch.aten.view %7504, %7505 : !torch.vtensor<[4,32,1,100],f32>, !torch.list -> !torch.vtensor<[128,1,100],f32> %int0_9895 = torch.constant.int 0 %int0_9896 = torch.constant.int 0 %int9223372036854775807_9897 = torch.constant.int 9223372036854775807 %int1_9898 = torch.constant.int 1 %7507 = torch.aten.slice.Tensor %7480, %int0_9895, %int0_9896, %int9223372036854775807_9897, %int1_9898 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_9899 = torch.constant.int 1 %int0_9900 = torch.constant.int 0 %int1_9901 = torch.constant.int 1 %7508 = torch.aten.slice.Tensor %7507, %int1_9899, %int0_9900, %7475, %int1_9901 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, 
!torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_9902 = torch.constant.int 1 %int2_9903 = torch.constant.int 2 %7509 = torch.aten.transpose.int %7508, %int1_9902, %int2_9903 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int2_9904 = torch.constant.int 2 %int3_9905 = torch.constant.int 3 %7510 = torch.aten.transpose.int %7509, %int2_9904, %int3_9905 : !torch.vtensor<[4,32,?,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int1_9906 = torch.constant.int 1 %7511 = torch.aten.size.int %7499, %int1_9906 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_9907 = torch.constant.int 4 %int32_9908 = torch.constant.int 32 %int100_9909 = torch.constant.int 100 %7512 = torch.prim.ListConstruct %int4_9907, %int32_9908, %int100_9909, %7511 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_9910 = torch.constant.bool false %7513 = torch.aten.expand %7510, %7512, %false_9910 : !torch.vtensor<[4,32,100,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,100,?],f32> %int0_9911 = torch.constant.int 0 %7514 = torch.aten.clone %7513, %int0_9911 : !torch.vtensor<[4,32,100,?],f32>, !torch.int -> !torch.vtensor<[4,32,100,?],f32> %int128_9912 = torch.constant.int 128 %int100_9913 = torch.constant.int 100 %7515 = torch.prim.ListConstruct %int128_9912, %int100_9913, %7511 : (!torch.int, !torch.int, !torch.int) -> !torch.list %7516 = torch.aten._unsafe_view %7514, %7515 : !torch.vtensor<[4,32,100,?],f32>, !torch.list -> !torch.vtensor<[128,100,?],f32> %7517 = torch.aten.bmm %7506, %7516 : !torch.vtensor<[128,1,100],f32>, !torch.vtensor<[128,100,?],f32> -> !torch.vtensor<[128,1,?],f32> %int4_9914 = torch.constant.int 4 %int32_9915 = torch.constant.int 32 %int1_9916 = torch.constant.int 1 %7518 = torch.prim.ListConstruct %int4_9914, %int32_9915, %int1_9916, %7511 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %7519 = torch.aten.view 
%7517, %7518 : !torch.vtensor<[128,1,?],f32>, !torch.list -> !torch.vtensor<[4,32,1,?],f32> %float1.000000e01_9917 = torch.constant.float 1.000000e+01 %7520 = torch.aten.div.Scalar %7519, %float1.000000e01_9917 : !torch.vtensor<[4,32,1,?],f32>, !torch.float -> !torch.vtensor<[4,32,1,?],f32> %int1_9918 = torch.constant.int 1 %7521 = torch.aten.add.Tensor %7520, %895, %int1_9918 : !torch.vtensor<[4,32,1,?],f32>, !torch.vtensor<[4,1,1,?],f32>, !torch.int -> !torch.vtensor<[4,32,1,?],f32> %int-1_9919 = torch.constant.int -1 %false_9920 = torch.constant.bool false %7522 = torch.aten._softmax %7521, %int-1_9919, %false_9920 : !torch.vtensor<[4,32,1,?],f32>, !torch.int, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int4_9921 = torch.constant.int 4 %int32_9922 = torch.constant.int 32 %int1_9923 = torch.constant.int 1 %7523 = torch.prim.ListConstruct %int4_9921, %int32_9922, %int1_9923, %7511 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_9924 = torch.constant.bool false %7524 = torch.aten.expand %7522, %7523, %false_9924 : !torch.vtensor<[4,32,1,?],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,1,?],f32> %int128_9925 = torch.constant.int 128 %int1_9926 = torch.constant.int 1 %7525 = torch.prim.ListConstruct %int128_9925, %int1_9926, %7511 : (!torch.int, !torch.int, !torch.int) -> !torch.list %7526 = torch.aten.view %7524, %7525 : !torch.vtensor<[4,32,1,?],f32>, !torch.list -> !torch.vtensor<[128,1,?],f32> %int0_9927 = torch.constant.int 0 %int0_9928 = torch.constant.int 0 %int9223372036854775807_9929 = torch.constant.int 9223372036854775807 %int1_9930 = torch.constant.int 1 %7527 = torch.aten.slice.Tensor %7497, %int0_9927, %int0_9928, %int9223372036854775807_9929, %int1_9930 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,2048,32,100],f32> %int1_9931 = torch.constant.int 1 %int0_9932 = torch.constant.int 0 %int1_9933 = torch.constant.int 1 %7528 = torch.aten.slice.Tensor %7527, 
%int1_9931, %int0_9932, %7475, %int1_9933 : !torch.vtensor<[4,2048,32,100],f32>, !torch.int, !torch.int, !torch.int, !torch.int -> !torch.vtensor<[4,?,32,100],f32> %int1_9934 = torch.constant.int 1 %int2_9935 = torch.constant.int 2 %7529 = torch.aten.transpose.int %7528, %int1_9934, %int2_9935 : !torch.vtensor<[4,?,32,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int1_9936 = torch.constant.int 1 %7530 = torch.aten.size.int %7501, %int1_9936 : !torch.vtensor<[4,?,32,100],f32>, !torch.int -> !torch.int %int4_9937 = torch.constant.int 4 %int32_9938 = torch.constant.int 32 %int100_9939 = torch.constant.int 100 %7531 = torch.prim.ListConstruct %int4_9937, %int32_9938, %7530, %int100_9939 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %false_9940 = torch.constant.bool false %7532 = torch.aten.expand %7529, %7531, %false_9940 : !torch.vtensor<[4,32,?,100],f32>, !torch.list, !torch.bool -> !torch.vtensor<[4,32,?,100],f32> %int0_9941 = torch.constant.int 0 %7533 = torch.aten.clone %7532, %int0_9941 : !torch.vtensor<[4,32,?,100],f32>, !torch.int -> !torch.vtensor<[4,32,?,100],f32> %int128_9942 = torch.constant.int 128 %int100_9943 = torch.constant.int 100 %7534 = torch.prim.ListConstruct %int128_9942, %7530, %int100_9943 : (!torch.int, !torch.int, !torch.int) -> !torch.list %7535 = torch.aten._unsafe_view %7533, %7534 : !torch.vtensor<[4,32,?,100],f32>, !torch.list -> !torch.vtensor<[128,?,100],f32> %7536 = torch.aten.bmm %7526, %7535 : !torch.vtensor<[128,1,?],f32>, !torch.vtensor<[128,?,100],f32> -> !torch.vtensor<[128,1,100],f32> %int4_9944 = torch.constant.int 4 %int32_9945 = torch.constant.int 32 %int1_9946 = torch.constant.int 1 %int100_9947 = torch.constant.int 100 %7537 = torch.prim.ListConstruct %int4_9944, %int32_9945, %int1_9946, %int100_9947 : (!torch.int, !torch.int, !torch.int, !torch.int) -> !torch.list %7538 = torch.aten.view %7536, %7537 : !torch.vtensor<[128,1,100],f32>, !torch.list -> 
!torch.vtensor<[4,32,1,100],f32> %int1_9948 = torch.constant.int 1 %int2_9949 = torch.constant.int 2 %7539 = torch.aten.transpose.int %7538, %int1_9948, %int2_9949 : !torch.vtensor<[4,32,1,100],f32>, !torch.int, !torch.int -> !torch.vtensor<[4,1,32,100],f32> %int4_9950 = torch.constant.int 4 %int1_9951 = torch.constant.int 1 %int-1_9952 = torch.constant.int -1 %7540 = torch.prim.ListConstruct %int4_9950, %int1_9951, %int-1_9952 : (!torch.int, !torch.int, !torch.int) -> !torch.list %7541 = torch.aten.view %7539, %7540 : !torch.vtensor<[4,1,32,100],f32>, !torch.list -> !torch.vtensor<[4,1,3200],f32> %7542 = torch_c.to_builtin_tensor %7541 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_9953 = tensor.cast %7542 : tensor<4x1x3200xf32> to tensor %7543 = torch_c.to_builtin_tensor %231 : !torch.vtensor<[3200,3200],f16> -> tensor<3200x3200xf16> %7544 = util.call @sharktank_mmtfp_3d_3200_3200_f32f16f32(%cast_9953, %7543) : (tensor, tensor<3200x3200xf16>) -> tensor %cast_9954 = tensor.cast %7544 : tensor to tensor<4x1x3200xf32> %7545 = torch_c.from_builtin_tensor %cast_9954 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int1_9955 = torch.constant.int 1 %7546 = torch.aten.add.Tensor %7303, %7545, %int1_9955 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_9956 = torch.constant.int 2 %7547 = torch.aten.pow.Tensor_Scalar %7546, %int2_9956 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_9957 = torch.constant.int -1 %7548 = torch.prim.ListConstruct %int-1_9957 : (!torch.int) -> !torch.list %true_9958 = torch.constant.bool true %none_9959 = torch.constant.none %7549 = torch.aten.mean.dim %7547, %7548, %true_9958, %none_9959 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_9960 = torch.constant.float 9.9999999747524271E-7 %int1_9961 = torch.constant.int 1 %7550 = 
torch.aten.add.Scalar %7549, %float9.999990e-07_9960, %int1_9961 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %7551 = torch.aten.rsqrt %7550 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %7552 = torch.aten.mul.Tensor %7546, %7551 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %7553 = torch.aten.mul.Tensor %7552, %232 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %7554 = torch_c.to_builtin_tensor %7553 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_9962 = tensor.cast %7554 : tensor<4x1x3200xf32> to tensor %7555 = torch_c.to_builtin_tensor %233 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %7556 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_9962, %7555) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_9963 = tensor.cast %7556 : tensor to tensor<4x1x8640xf32> %7557 = torch_c.from_builtin_tensor %cast_9963 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %7558 = torch.aten.silu %7557 : !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32> %7559 = torch_c.to_builtin_tensor %7553 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_9964 = tensor.cast %7559 : tensor<4x1x3200xf32> to tensor %7560 = torch_c.to_builtin_tensor %234 : !torch.vtensor<[8640,3200],f16> -> tensor<8640x3200xf16> %7561 = util.call @sharktank_mmtfp_3d_8640_3200_f32f16f32(%cast_9964, %7560) : (tensor, tensor<8640x3200xf16>) -> tensor %cast_9965 = tensor.cast %7561 : tensor to tensor<4x1x8640xf32> %7562 = torch_c.from_builtin_tensor %cast_9965 : tensor<4x1x8640xf32> -> !torch.vtensor<[4,1,8640],f32> %7563 = torch.aten.mul.Tensor %7558, %7562 : !torch.vtensor<[4,1,8640],f32>, !torch.vtensor<[4,1,8640],f32> -> !torch.vtensor<[4,1,8640],f32> %7564 = torch_c.to_builtin_tensor %7563 : !torch.vtensor<[4,1,8640],f32> -> tensor<4x1x8640xf32> %cast_9966 = tensor.cast %7564 : 
tensor<4x1x8640xf32> to tensor %7565 = torch_c.to_builtin_tensor %235 : !torch.vtensor<[3200,8640],f16> -> tensor<3200x8640xf16> %7566 = util.call @sharktank_mmtfp_3d_3200_8640_f32f16f32(%cast_9966, %7565) : (tensor, tensor<3200x8640xf16>) -> tensor %cast_9967 = tensor.cast %7566 : tensor to tensor<4x1x3200xf32> %7567 = torch_c.from_builtin_tensor %cast_9967 : tensor<4x1x3200xf32> -> !torch.vtensor<[4,1,3200],f32> %int1_9968 = torch.constant.int 1 %7568 = torch.aten.add.Tensor %7546, %7567, %int1_9968 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int2_9969 = torch.constant.int 2 %7569 = torch.aten.pow.Tensor_Scalar %7568, %int2_9969 : !torch.vtensor<[4,1,3200],f32>, !torch.int -> !torch.vtensor<[4,1,3200],f32> %int-1_9970 = torch.constant.int -1 %7570 = torch.prim.ListConstruct %int-1_9970 : (!torch.int) -> !torch.list %true_9971 = torch.constant.bool true %none_9972 = torch.constant.none %7571 = torch.aten.mean.dim %7569, %7570, %true_9971, %none_9972 : !torch.vtensor<[4,1,3200],f32>, !torch.list, !torch.bool, !torch.none -> !torch.vtensor<[4,1,1],f32> %float9.999990e-07_9973 = torch.constant.float 9.9999999747524271E-7 %int1_9974 = torch.constant.int 1 %7572 = torch.aten.add.Scalar %7571, %float9.999990e-07_9973, %int1_9974 : !torch.vtensor<[4,1,1],f32>, !torch.float, !torch.int -> !torch.vtensor<[4,1,1],f32> %7573 = torch.aten.rsqrt %7572 : !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,1],f32> %7574 = torch.aten.mul.Tensor %7568, %7573 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[4,1,1],f32> -> !torch.vtensor<[4,1,3200],f32> %7575 = torch.aten.mul.Tensor %7574, %236 : !torch.vtensor<[4,1,3200],f32>, !torch.vtensor<[3200],f32> -> !torch.vtensor<[4,1,3200],f32> %7576 = torch_c.to_builtin_tensor %7575 : !torch.vtensor<[4,1,3200],f32> -> tensor<4x1x3200xf32> %cast_9975 = tensor.cast %7576 : tensor<4x1x3200xf32> to tensor %7577 = torch_c.to_builtin_tensor %237 : 
!torch.vtensor<[32000,3200],f16> -> tensor<32000x3200xf16> %7578 = util.call @sharktank_mmtfp_3d_32000_3200_f32f16f32(%cast_9975, %7577) : (tensor, tensor<32000x3200xf16>) -> tensor %cast_9976 = tensor.cast %7578 : tensor to tensor<4x1x32000xf32> %7579 = torch_c.from_builtin_tensor %cast_9976 : tensor<4x1x32000xf32> -> !torch.vtensor<[4,1,32000],f32> return %7579 : !torch.vtensor<[4,1,32000],f32> }

// -----------------------------------------------------------------------------
// @sharktank_mmtfp_3d_3200_3200_f32f16f32
//
// Private helper: multiplies %arg0 by the 3200x3200 f16 operand %arg1 using
// linalg.batch_matmul_transpose_b and returns the product.
//
// NOTE(review): every bare `tensor` type in this function (no shape or element
// type) looks truncated -- `tensor` on its own is not a complete builtin type.
// The two size operands of `tensor.empty(%dim, %dim_0)` suggest a result with
// two dynamic dimensions, and the call site visible in the main function casts
// tensor<4x1x3200xf32> in and the result back to tensor<4x1x3200xf32>.
// Confirm the full types against the generator output before relying on them.
// -----------------------------------------------------------------------------
util.func private @sharktank_mmtfp_3d_3200_3200_f32f16f32(%arg0: tensor, %arg1: tensor<3200x3200xf16>) -> tensor {
  // Zero value used below to initialise the matmul output buffer (%3).
  %cst = arith.constant 0.000000e+00 : f32
  %c0 = arith.constant 0 : index
  %c1 = arith.constant 1 : index
  // Runtime extents of dimensions 0 and 1 of %arg0.
  %dim = tensor.dim %arg0, %c0 : tensor
  %dim_0 = tensor.dim %arg0, %c1 : tensor
  // Replicate %arg1 along a leading dimension of extent %dim: the input is
  // indexed with #map (d1, d2), the output with #map1 (d0, d1, d2), and the
  // body yields the input element unchanged, so out[d0, d1, d2] = %arg1[d1, d2].
  %0 = tensor.empty(%dim) : tensor
  %1 = linalg.generic {indexing_maps = [#map, #map1], iterator_types = ["parallel", "parallel", "parallel"]} ins(%arg1 : tensor<3200x3200xf16>) outs(%0 : tensor) {
  ^bb0(%in: f16, %out: f16):
    linalg.yield %in : f16
  } -> tensor
  // Output buffer sized by (%dim, %dim_0) and filled with 0.0.
  %2 = tensor.empty(%dim, %dim_0) : tensor
  %3 = linalg.fill ins(%cst : f32) outs(%2 : tensor) -> tensor
  // Batched matmul of %arg0 with the replicated operand %1; per the op name the
  // second operand is consumed in transposed form.
  %4 = linalg.batch_matmul_transpose_b ins(%arg0, %1 : tensor, tensor) outs(%3 : tensor) -> tensor
  // Copy the product into a freshly allocated tensor of the same dynamic sizes.
  // NOTE(review): with the types stripped it is not visible whether this copy
  // also changes the element type -- confirm.
  %5 = tensor.empty(%dim, %dim_0) : tensor
  %6 = linalg.copy ins(%4 : tensor) outs(%5 : tensor) -> tensor
  util.return %6 : tensor
}

// -----------------------------------------------------------------------------
// @sharktank_mmtfp_3d_8640_3200_f32f16f32
//
// Same op sequence as the 3200x3200 helper, with an 8640x3200 f16 operand
// %arg1. The call sites visible in the main function cast tensor<4x1x3200xf32>
// in and cast the result to tensor<4x1x8640xf32>.
//
// NOTE(review): bare `tensor` types appear truncated here as well -- confirm.
// -----------------------------------------------------------------------------
util.func private @sharktank_mmtfp_3d_8640_3200_f32f16f32(%arg0: tensor, %arg1: tensor<8640x3200xf16>) -> tensor {
  // Zero value used to initialise the matmul output buffer (%3).
  %cst = arith.constant 0.000000e+00 : f32
  %c0 = arith.constant 0 : index
  %c1 = arith.constant 1 : index
  // Runtime extents of dimensions 0 and 1 of %arg0.
  %dim = tensor.dim %arg0, %c0 : tensor
  %dim_0 = tensor.dim %arg0, %c1 : tensor
  // out[d0, d1, d2] = %arg1[d1, d2]: %arg1 replicated %dim times along d0.
  %0 = tensor.empty(%dim) : tensor
  %1 = linalg.generic {indexing_maps = [#map, #map1], iterator_types = ["parallel", "parallel", "parallel"]} ins(%arg1 : tensor<8640x3200xf16>) outs(%0 : tensor) {
  ^bb0(%in: f16, %out: f16):
    linalg.yield %in : f16
  } -> tensor
  // Zero-filled output buffer sized by (%dim, %dim_0).
  %2 = tensor.empty(%dim, %dim_0) : tensor
  %3 = linalg.fill ins(%cst : f32) outs(%2 : tensor) -> tensor
  // Batched matmul against the replicated operand (transposed per the op name).
  %4 = linalg.batch_matmul_transpose_b ins(%arg0, %1 : tensor, tensor) outs(%3 : tensor) -> tensor
  // Copy the product into a fresh tensor and return it.
  %5 = tensor.empty(%dim, %dim_0) : tensor
  %6 = linalg.copy ins(%4 : tensor) outs(%5 : tensor) -> tensor
  util.return %6 : tensor
}

// -----------------------------------------------------------------------------
// @sharktank_mmtfp_3d_3200_8640_f32f16f32
//
// Same op sequence as the helpers above, with a 3200x8640 f16 operand %arg1.
// The call site visible in the main function casts tensor<4x1x8640xf32> in and
// casts the result to tensor<4x1x3200xf32>.
//
// NOTE(review): bare `tensor` types appear truncated here as well -- confirm.
// -----------------------------------------------------------------------------
util.func private @sharktank_mmtfp_3d_3200_8640_f32f16f32(%arg0: tensor, %arg1: tensor<3200x8640xf16>) -> tensor {
  // Zero value used to initialise the matmul output buffer (%3).
  %cst = arith.constant 0.000000e+00 : f32
  %c0 = arith.constant 0 : index
  %c1 = arith.constant 1 : index
  // Runtime extents of dimensions 0 and 1 of %arg0.
  %dim = tensor.dim %arg0, %c0 : tensor
  %dim_0 = tensor.dim %arg0, %c1 : tensor
  // out[d0, d1, d2] = %arg1[d1, d2]: %arg1 replicated %dim times along d0.
  %0 = tensor.empty(%dim) : tensor
  %1 = linalg.generic {indexing_maps = [#map, #map1], iterator_types = ["parallel", "parallel", "parallel"]} ins(%arg1 : tensor<3200x8640xf16>) outs(%0 : tensor) {
  ^bb0(%in: f16, %out: f16):
    linalg.yield %in : f16
  } -> tensor
  // Zero-filled output buffer sized by (%dim, %dim_0).
  %2 = tensor.empty(%dim, %dim_0) : tensor
  %3 = linalg.fill ins(%cst : f32) outs(%2 : tensor) -> tensor
  // Batched matmul against the replicated operand (transposed per the op name).
  %4 = linalg.batch_matmul_transpose_b ins(%arg0, %1 : tensor, tensor) outs(%3 : tensor) -> tensor
  // Copy the product into a fresh tensor and return it.
  %5 = tensor.empty(%dim, %dim_0) : tensor
  %6 = linalg.copy ins(%4 : tensor) outs(%5 : tensor) -> tensor
  util.return %6 : tensor
}

// -----------------------------------------------------------------------------
// @sharktank_mmtfp_3d_32000_3200_f32f16f32
//
// Same op sequence as the helpers above, with a 32000x3200 f16 operand %arg1.
// The call site at the end of the main function casts tensor<4x1x3200xf32> in
// and casts the result to tensor<4x1x32000xf32>, which is the value the main
// function returns.
//
// NOTE(review): bare `tensor` types appear truncated here as well -- confirm.
// -----------------------------------------------------------------------------
util.func private @sharktank_mmtfp_3d_32000_3200_f32f16f32(%arg0: tensor, %arg1: tensor<32000x3200xf16>) -> tensor {
  // Zero value used to initialise the matmul output buffer (%3).
  %cst = arith.constant 0.000000e+00 : f32
  %c0 = arith.constant 0 : index
  %c1 = arith.constant 1 : index
  // Runtime extents of dimensions 0 and 1 of %arg0.
  %dim = tensor.dim %arg0, %c0 : tensor
  %dim_0 = tensor.dim %arg0, %c1 : tensor
  // out[d0, d1, d2] = %arg1[d1, d2]: %arg1 replicated %dim times along d0.
  %0 = tensor.empty(%dim) : tensor
  %1 = linalg.generic {indexing_maps = [#map, #map1], iterator_types = ["parallel", "parallel", "parallel"]} ins(%arg1 : tensor<32000x3200xf16>) outs(%0 : tensor) {
  ^bb0(%in: f16, %out: f16):
    linalg.yield %in : f16
  } -> tensor
  // Zero-filled output buffer sized by (%dim, %dim_0).
  %2 = tensor.empty(%dim, %dim_0) : tensor
  %3 = linalg.fill ins(%cst : f32) outs(%2 : tensor) -> tensor
  // Batched matmul against the replicated operand (transposed per the op name).
  %4 = linalg.batch_matmul_transpose_b ins(%arg0, %1 : tensor, tensor) outs(%3 : tensor) -> tensor
  // Copy the product into a fresh tensor and return it.
  %5 = tensor.empty(%dim, %dim_0) : tensor
  %6 = linalg.copy ins(%4 : tensor) outs(%5 : tensor) -> tensor
  util.return %6 : tensor
}
}
{-# dialect_resources: { builtin: {
__auto.constant_2048_50_torch.complex64: "} } #-}